diff --git a/.coveragerc b/.coveragerc deleted file mode 100644 index 3f630aa6cf8f5..0000000000000 --- a/.coveragerc +++ /dev/null @@ -1,27 +0,0 @@ -# .coveragerc to control coverage.py -[run] -branch = False -omit = */tests/* - -[report] -# Regexes for lines to exclude from consideration -exclude_lines = - # Have to re-enable the standard pragma - pragma: no cover - - # Don't complain about missing debug-only code: - def __repr__ - if self\.debug - - # Don't complain if tests don't hit defensive assertion code: - raise AssertionError - raise NotImplementedError - - # Don't complain if non-runnable code isn't run: - if 0: - if __name__ == .__main__.: - -ignore_errors = False - -[html] -directory = coverage_html_report diff --git a/.github/CODE_OF_CONDUCT.md b/.github/CODE_OF_CONDUCT.md new file mode 100644 index 0000000000000..a1fbece3284ec --- /dev/null +++ b/.github/CODE_OF_CONDUCT.md @@ -0,0 +1,63 @@ +# Contributor Code of Conduct + +As contributors and maintainers of this project, and in the interest of +fostering an open and welcoming community, we pledge to respect all people who +contribute through reporting issues, posting feature requests, updating +documentation, submitting pull requests or patches, and other activities. + +We are committed to making participation in this project a harassment-free +experience for everyone, regardless of level of experience, gender, gender +identity and expression, sexual orientation, disability, personal appearance, +body size, race, ethnicity, age, religion, or nationality. + +Examples of unacceptable behavior by participants include: + +* The use of sexualized language or imagery +* Personal attacks +* Trolling or insulting/derogatory comments +* Public or private harassment +* Publishing other's private information, such as physical or electronic + addresses, without explicit permission +* Other unethical or unprofessional conduct + +Project maintainers have the right and responsibility to remove, edit, or +reject comments, commits, code, wiki edits, issues, and other contributions +that are not aligned to this Code of Conduct, or to ban temporarily or +permanently any contributor for other behaviors that they deem inappropriate, +threatening, offensive, or harmful. + +By adopting this Code of Conduct, project maintainers commit themselves to +fairly and consistently applying these principles to every aspect of managing +this project. Project maintainers who do not follow or enforce the Code of +Conduct may be permanently removed from the project team. + +This Code of Conduct applies both within project spaces and in public spaces +when an individual is representing the project or its community. + +A working group of community members is committed to promptly addressing any +reported issues. The working group is made up of pandas contributors and users. +Instances of abusive, harassing, or otherwise unacceptable behavior may be +reported by contacting the working group by e-mail (pandas-coc@googlegroups.com). +Messages sent to this e-mail address will not be publicly visible but only to +the working group members. The working group currently includes + +- Safia Abdalla +- Tom Augspurger +- Joris Van den Bossche +- Camille Scott +- Nathaniel Smith + +All complaints will be reviewed and investigated and will result in a response +that is deemed necessary and appropriate to the circumstances. Maintainers are +obligated to maintain confidentiality with regard to the reporter of an +incident. 
+ +This Code of Conduct is adapted from the [Contributor Covenant][homepage], +version 1.3.0, available at +[http://contributor-covenant.org/version/1/3/0/][version], +and the [Swift Code of Conduct][swift]. + +[homepage]: http://contributor-covenant.org +[version]: http://contributor-covenant.org/version/1/3/0/ +[swift]: https://swift.org/community/#code-of-conduct + diff --git a/.github/CONTRIBUTING.md b/.github/CONTRIBUTING.md index 95729f845ff5c..faff68b636109 100644 --- a/.github/CONTRIBUTING.md +++ b/.github/CONTRIBUTING.md @@ -1,24 +1,23 @@ -Contributing to pandas -====================== +# Contributing to pandas Whether you are a novice or experienced software developer, all contributions and suggestions are welcome! -Our main contribution docs can be found [here](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst), but if you do not want to read it in its entirety, we will summarize the main ways in which you can contribute and point to relevant places in the docs for further information. +Our main contributing guide can be found [in this repo](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst) or [on the website](https://pandas-docs.github.io/pandas-docs-travis/contributing.html). If you do not want to read it in its entirety, we will summarize the main ways in which you can contribute and point to relevant sections of that document for further information. + +## Getting Started -Getting Started ---------------- If you are looking to contribute to the *pandas* codebase, the best place to start is the [GitHub "issues" tab](https://github.com/pandas-dev/pandas/issues). This is also a great place for filing bug reports and making suggestions for ways in which we can improve the code and documentation. -If you have additional questions, feel free to ask them on the [mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata) or on [Gitter](https://gitter.im/pydata/pandas). Further information can also be found in our [Getting Started](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#where-to-start) section of our main contribution doc. +If you have additional questions, feel free to ask them on the [mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata) or on [Gitter](https://gitter.im/pydata/pandas). Further information can also be found in the "[Where to start?](https://github.com/pandas-dev/pandas/blob/master/doc/source/development/contributing.rst#where-to-start)" section. + +## Filing Issues + +If you notice a bug in the code or documentation, or have suggestions for how we can improve either, feel free to create an issue on the [GitHub "issues" tab](https://github.com/pandas-dev/pandas/issues) using [GitHub's "issue" form](https://github.com/pandas-dev/pandas/issues/new). The form contains some questions that will help us best address your issue. For more information regarding how to file issues against *pandas*, please refer to the "[Bug reports and enhancement requests](https://github.com/pandas-dev/pandas/blob/master/doc/source/development/contributing.rst#bug-reports-and-enhancement-requests)" section. -Filing Issues -------------- -If you notice a bug in the code or in docs or have suggestions for how we can improve either, feel free to create an issue on the [GitHub "issues" tab](https://github.com/pandas-dev/pandas/issues) using [GitHub's "issue" form](https://github.com/pandas-dev/pandas/issues/new). 
The form contains some questions that will help us best address your issue. For more information regarding how to file issues against *pandas*, please refer to the [Bug reports and enhancement requests](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#bug-reports-and-enhancement-requests) section of our main contribution doc. +## Contributing to the Codebase -Contributing to the Codebase ----------------------------- -The code is hosted on [GitHub](https://www.github.com/pandas-dev/pandas), so you will need to use [Git](http://git-scm.com/) to clone the project and make changes to the codebase. Once you have obtained a copy of the code, you should create a development environment that is separate from your existing Python environment so that you can make and test changes without compromising your own work environment. For more information, please refer to our [Working with the code](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#working-with-the-code) section of our main contribution docs. +The code is hosted on [GitHub](https://www.github.com/pandas-dev/pandas), so you will need to use [Git](http://git-scm.com/) to clone the project and make changes to the codebase. Once you have obtained a copy of the code, you should create a development environment that is separate from your existing Python environment so that you can make and test changes without compromising your own work environment. For more information, please refer to the "[Working with the code](https://github.com/pandas-dev/pandas/blob/master/doc/source/development/contributing.rst#working-with-the-code)" section. -Before submitting your changes for review, make sure to check that your changes do not break any tests. You can find more information about our test suites can be found [here](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#test-driven-development-code-writing). We also have guidelines regarding coding style that will be enforced during testing. Details about coding style can be found [here](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#code-standards). +Before submitting your changes for review, make sure to check that your changes do not break any tests. You can find more information about our test suites in the "[Test-driven development/code writing](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#test-driven-development-code-writing)" section. We also have guidelines regarding coding style that will be enforced during testing, which can be found in the "[Code standards](https://github.com/pandas-dev/pandas/blob/master/doc/source/development/contributing.rst#code-standards)" section. -Once your changes are ready to be submitted, make sure to push your changes to GitHub before creating a pull request. Details about how to do that can be found in the [Contributing your changes to pandas](https://github.com/pandas-dev/pandas/blob/master/doc/source/contributing.rst#contributing-your-changes-to-pandas) section of our main contribution docs. We will review your changes, and you will most likely be asked to make additional changes before it is finally ready to merge. However, once it's ready, we will merge it, and you will have successfully contributed to the codebase! +Once your changes are ready to be submitted, make sure to push your changes to GitHub before creating a pull request. 
Details about how to do that can be found in the "[Contributing your changes to pandas](https://github.com/pandas-dev/pandas/blob/master/doc/source/development/contributing.rst#contributing-your-changes-to-pandas)" section. We will review your changes, and you will most likely be asked to make additional changes before it is finally ready to merge. However, once it's ready, we will merge it, and you will have successfully contributed to the codebase! diff --git a/.github/ISSUE_TEMPLATE.md b/.github/ISSUE_TEMPLATE.md index 1f614b54b1f71..e33835c462511 100644 --- a/.github/ISSUE_TEMPLATE.md +++ b/.github/ISSUE_TEMPLATE.md @@ -8,11 +8,22 @@ [this should explain **why** the current behaviour is a problem and why the expected output is a better solution.] +**Note**: We receive a lot of issues on our GitHub tracker, so it is very possible that your issue has been posted before. Please check first before submitting so that we do not have to handle and close duplicates! + +**Note**: Many problems can be resolved by simply upgrading `pandas` to the latest version. Before submitting, please check if that solution works for you. If possible, you may want to check if `master` addresses this issue, but that is not necessary. + +For documentation-related issues, you can check the latest versions of the docs on `master` here: + +https://pandas-docs.github.io/pandas-docs-travis/ + +If the issue has not been resolved there, go ahead and file it in the issue tracker. + #### Expected Output #### Output of ``pd.show_versions()``
-# Paste the output here pd.show_versions() here + +[paste the output of ``pd.show_versions()`` below this line]
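The output requested by the template comes from `pandas.show_versions()`, which prints the installed pandas version together with the versions of its required and optional dependencies. A minimal way to produce it (assuming pandas is importable in the environment where the issue was observed):

```python
# Print pandas and dependency version information for pasting into the issue.
import pandas as pd

pd.show_versions()
```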
diff --git a/.github/PULL_REQUEST_TEMPLATE.md b/.github/PULL_REQUEST_TEMPLATE.md index 9281c51059087..4e1e9ce017408 100644 --- a/.github/PULL_REQUEST_TEMPLATE.md +++ b/.github/PULL_REQUEST_TEMPLATE.md @@ -1,4 +1,4 @@ - - [ ] closes #xxxx - - [ ] tests added / passed - - [ ] passes ``git diff upstream/master --name-only -- '*.py' | flake8 --diff`` - - [ ] whatsnew entry +- [ ] closes #xxxx +- [ ] tests added / passed +- [ ] passes `git diff upstream/master -u -- "*.py" | flake8 --diff` +- [ ] whatsnew entry diff --git a/.gitignore b/.gitignore index a509fcf736ea8..816aff376fc83 100644 --- a/.gitignore +++ b/.gitignore @@ -7,6 +7,7 @@ *$ *.bak *flymake* +*.iml *.kdev4 *.log *.swp @@ -20,6 +21,7 @@ .ipynb_checkpoints .tags .cache/ +.vscode/ # Compiled source # ################### @@ -59,6 +61,9 @@ dist .coverage coverage.xml coverage_html_report +*.pytest_cache +# hypothesis test database +.hypothesis/ # OS generated files # ###################### @@ -86,8 +91,8 @@ scikits *.c *.cpp -# Performance Testing # -####################### +# Unit / Performance Testing # +############################## asv_bench/env/ asv_bench/html/ asv_bench/results/ @@ -96,6 +101,8 @@ asv_bench/pandas/ # Documentation generated files # ################################# doc/source/generated +doc/source/user_guide/styled.xlsx +doc/source/reference/api doc/source/_static doc/source/vbench doc/source/vbench.rst @@ -103,3 +110,5 @@ doc/source/index.rst doc/build/html/index.html # Windows specific leftover: doc/tmp.sv +env/ +doc/source/savefig/ diff --git a/.pep8speaks.yml b/.pep8speaks.yml new file mode 100644 index 0000000000000..cbcb098c47125 --- /dev/null +++ b/.pep8speaks.yml @@ -0,0 +1,19 @@ +# File : .pep8speaks.yml + +scanner: + diff_only: True # If True, errors caused by only the patch are shown + +# Opened issue in pep8speaks, so we can directly use the config in setup.cfg +# (and avoid having to duplicate it here): +# https://github.com/OrkoHunter/pep8speaks/issues/95 + +pycodestyle: + max-line-length: 79 + ignore: + - W503, # line break before binary operator + - W504, # line break after binary operator + - E402, # module level import not at top of file + - E731, # do not assign a lambda expression, use a def + - C406, # Unnecessary list literal - rewrite as a dict literal. + - C408, # Unnecessary dict call - rewrite as a literal. + - C409 # Unnecessary list passed to tuple() - rewrite as a tuple literal. 
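The pycodestyle ignore list above mirrors the checks that CI runs via `git diff upstream/master -u -- "*.py" | flake8 --diff`. As a rough local equivalent, flake8's legacy Python API can be pointed at individual files with comparable settings; this is only a sketch — the ignore codes echo the config above, and the file path is an illustrative assumption, not a required target:

```python
# Sketch: lint a file with roughly the settings from .pep8speaks.yml.
from flake8.api import legacy as flake8

style_guide = flake8.get_style_guide(
    max_line_length=79,
    ignore=["W503", "W504", "E402", "E731"],
)
report = style_guide.check_files(["pandas/core/frame.py"])  # example path
print(report.total_errors)  # number of style violations found
```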
diff --git a/.travis.yml b/.travis.yml index d864b755541de..e478d71a5c350 100644 --- a/.travis.yml +++ b/.travis.yml @@ -7,7 +7,7 @@ python: 3.5 # set NOCACHE-true # To delete caches go to https://travis-ci.org/OWNER/REPOSITORY/caches or run # travis cache --delete inside the project directory from the travis command line client -# The cash directories will be deleted if anything in ci/ changes in a commit +# The cache directories will be deleted if anything in ci/ changes in a commit cache: ccache: true directories: @@ -16,80 +16,64 @@ cache: env: global: - - # pandas-docs-travis GH - - secure: "YvvTc+FrSYHgdxqoxn9s8VOaCWjvZzlkaf6k55kkmQqCYR9dPiLMsot1F96/N7o3YlD1s0znPQCak93Du8HHi/8809zAXloTaMSZrWz4R4qn96xlZFRE88O/w/Z1t3VVYpKX3MHlCggBc8MtXrqmvWKJMAqXyysZ4TTzoiJDPvE=" + # create a github personal access token + # cd pandas-dev/pandas + # travis encrypt 'PANDAS_GH_TOKEN=personal_access_token' -r pandas-dev/pandas + - secure: "EkWLZhbrp/mXJOx38CHjs7BnjXafsqHtwxPQrqWy457VDFWhIY1DMnIR/lOWG+a20Qv52sCsFtiZEmMfUjf0pLGXOqurdxbYBGJ7/ikFLk9yV2rDwiArUlVM9bWFnFxHvdz9zewBH55WurrY4ShZWyV+x2dWjjceWG5VpWeI6sA=" git: # for cloning - depth: 1000 + depth: 2000 matrix: fast_finish: true exclude: # Exclude the default Python 3.5 build - python: 3.5 + include: - - os: osx - language: generic - env: - - JOB="3.5_OSX" TEST_ARGS="--skip-slow --skip-network" - - os: linux + - dist: trusty env: - - JOB="2.7_LOCALE" TEST_ARGS="--only-slow --skip-network" LOCALE_OVERRIDE="zh_CN.UTF-8" - addons: - apt: - packages: - - language-pack-zh-hans - - os: linux + - JOB="3.7" ENV_FILE="ci/deps/travis-37.yaml" PATTERN="(not slow and not network)" + + - dist: trusty env: - - JOB="2.7" TEST_ARGS="--skip-slow" LINT=true + - JOB="2.7" ENV_FILE="ci/deps/travis-27.yaml" PATTERN="(not slow or (single and db))" addons: apt: packages: - python-gtk2 - - os: linux - env: - - JOB="3.5" TEST_ARGS="--skip-slow --skip-network" COVERAGE=true - addons: - apt: - packages: - - xsel - - os: linux - env: - - JOB="3.6" TEST_ARGS="--skip-slow --skip-network" PANDAS_TESTING_MODE="deprecate" CONDA_FORGE=true - # In allow_failures - - os: linux + + - dist: trusty env: - - JOB="2.7_SLOW" TEST_ARGS="--only-slow --skip-network" - # In allow_failures - - os: linux + - JOB="3.6, locale" ENV_FILE="ci/deps/travis-36-locale.yaml" PATTERN="((not slow and not network) or (single and db))" LOCALE_OVERRIDE="zh_CN.UTF-8" + + - dist: trusty env: - - JOB="2.7_BUILD_TEST" TEST_ARGS="--skip-slow" BUILD_TEST=true + - JOB="3.6, coverage" ENV_FILE="ci/deps/travis-36.yaml" PATTERN="((not slow and not network) or (single and db))" PANDAS_TESTING_MODE="deprecate" COVERAGE=true + # In allow_failures - - os: linux + - dist: trusty env: - - JOB="3.6_NUMPY_DEV" TEST_ARGS="--skip-slow --skip-network" PANDAS_TESTING_MODE="deprecate" + - JOB="3.6, slow" ENV_FILE="ci/deps/travis-36-slow.yaml" PATTERN="slow" + # In allow_failures - - os: linux + - dist: trusty env: - - JOB="3.5_DOC" DOC=true + - JOB="3.6, doc" ENV_FILE="ci/deps/travis-36-doc.yaml" DOC=true allow_failures: - - os: linux + - dist: trusty env: - - JOB="2.7_SLOW" TEST_ARGS="--only-slow --skip-network" - - os: linux + - JOB="3.6, slow" ENV_FILE="ci/deps/travis-36-slow.yaml" PATTERN="slow" + - dist: trusty env: - - JOB="2.7_BUILD_TEST" TEST_ARGS="--skip-slow" BUILD_TEST=true - - os: linux - env: - - JOB="3.6_NUMPY_DEV" TEST_ARGS="--skip-slow --skip-network" PANDAS_TESTING_MODE="deprecate" - - os: linux - env: - - JOB="3.5_DOC" DOC=true + - JOB="3.6, doc" ENV_FILE="ci/deps/travis-36-doc.yaml" DOC=true before_install: - echo 
"before_install" + # set non-blocking IO on travis + # https://github.com/travis-ci/travis-ci/issues/8920#issuecomment-352661024 + - python -c 'import os,sys,fcntl; flags = fcntl.fcntl(sys.stdout, fcntl.F_GETFL); fcntl.fcntl(sys.stdout, fcntl.F_SETFL, flags&~os.O_NONBLOCK);' - source ci/travis_process_gbq_encryption.sh - export PATH="$HOME/miniconda3/bin:$PATH" - df -h @@ -97,8 +81,12 @@ before_install: - uname -a - git --version - git tag - - ci/before_install_travis.sh - - export DISPLAY=":99.0" + # Because travis runs on Google Cloud and has a /etc/boto.cfg, + # it breaks moto import, see: + # https://github.com/spulec/moto/issues/1771 + # https://github.com/boto/boto/issues/3741 + # This overrides travis and tells it to look nowhere. + - export BOTO_CONFIG=/dev/null install: - echo "install start" @@ -109,25 +97,22 @@ install: before_script: - ci/install_db_travis.sh + - export DISPLAY=":99.0" + - ci/before_script_travis.sh script: - echo "script start" - - ci/run_build_docs.sh - - ci/script_single.sh - - ci/script_multi.sh - - ci/lint.sh - - echo "script done" - -after_success: - - ci/upload_coverage.sh + - source activate pandas-dev + - ci/build_docs.sh + - ci/run_tests.sh after_script: - echo "after_script start" - - source activate pandas && python -c "import pandas; pandas.show_versions();" - - if [ -e /tmp/single.xml ]; then - ci/print_skipped.py /tmp/single.xml; + - source activate pandas-dev && pushd /tmp && python -c "import pandas; pandas.show_versions();" && popd + - if [ -e test-data-single.xml ]; then + ci/print_skipped.py test-data-single.xml; fi - - if [ -e /tmp/multiple.xml ]; then - ci/print_skipped.py /tmp/multiple.xml; + - if [ -e test-data-multiple.xml ]; then + ci/print_skipped.py test-data-multiple.xml; fi - echo "after_script done" diff --git a/AUTHORS.md b/AUTHORS.md new file mode 100644 index 0000000000000..dcaaea101f4c8 --- /dev/null +++ b/AUTHORS.md @@ -0,0 +1,57 @@ +About the Copyright Holders +=========================== + +* Copyright (c) 2008-2011 AQR Capital Management, LLC + + AQR Capital Management began pandas development in 2008. Development was + led by Wes McKinney. AQR released the source under this license in 2009. +* Copyright (c) 2011-2012, Lambda Foundry, Inc. + + Wes is now an employee of Lambda Foundry, and remains the pandas project + lead. +* Copyright (c) 2011-2012, PyData Development Team + + The PyData Development Team is the collection of developers of the PyData + project. This includes all of the PyData sub-projects, including pandas. The + core team that coordinates development on GitHub can be found here: + http://github.com/pydata. + +Full credits for pandas contributors can be found in the documentation. + +Our Copyright Policy +==================== + +PyData uses a shared copyright model. Each contributor maintains copyright +over their contributions to PyData. However, it is important to note that +these contributions are typically only changes to the repositories. Thus, +the PyData source code, in its entirety, is not the copyright of any single +person or institution. Instead, it is the collective copyright of the +entire PyData Development Team. If individual contributors want to maintain +a record of what changes/contributions they have specific copyright on, +they should indicate their copyright in the commit message of the change +when they commit the change to one of the PyData repositories. 
+ +With this in mind, the following banner should be used in any source code +file to indicate the copyright and license terms: + +``` +#----------------------------------------------------------------------------- +# Copyright (c) 2012, PyData Development Team +# All rights reserved. +# +# Distributed under the terms of the BSD Simplified License. +# +# The full license is in the LICENSE file, distributed with this software. +#----------------------------------------------------------------------------- +``` + +Other licenses can be found in the LICENSES directory. + +License +======= + +pandas is distributed under a 3-clause ("Simplified" or "New") BSD +license. Parts of NumPy, SciPy, numpydoc, bottleneck, which all have +BSD-compatible licenses, are included. Their licenses follow the pandas +license. + diff --git a/LICENSE b/LICENSE index c9b8834e8774b..924de26253bf4 100644 --- a/LICENSE +++ b/LICENSE @@ -1,87 +1,29 @@ -======= -License -======= +BSD 3-Clause License -pandas is distributed under a 3-clause ("Simplified" or "New") BSD -license. Parts of NumPy, SciPy, numpydoc, bottleneck, which all have -BSD-compatible licenses, are included. Their licenses follow the pandas -license. - -pandas license -============== - -Copyright (c) 2011-2012, Lambda Foundry, Inc. and PyData Development Team -All rights reserved. - -Copyright (c) 2008-2011 AQR Capital Management, LLC +Copyright (c) 2008-2012, AQR Capital Management, LLC, Lambda Foundry, Inc. and PyData Development Team All rights reserved. Redistribution and use in source and binary forms, with or without -modification, are permitted provided that the following conditions are -met: - - * Redistributions of source code must retain the above copyright - notice, this list of conditions and the following disclaimer. - - * Redistributions in binary form must reproduce the above - copyright notice, this list of conditions and the following - disclaimer in the documentation and/or other materials provided - with the distribution. - - * Neither the name of the copyright holder nor the names of any - contributors may be used to endorse or promote products derived - from this software without specific prior written permission. - -THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER AND CONTRIBUTORS -"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT -LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR -A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT -OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, -SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT -LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, -DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY -THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT -(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +modification, are permitted provided that the following conditions are met: + +* Redistributions of source code must retain the above copyright notice, this + list of conditions and the following disclaimer. + +* Redistributions in binary form must reproduce the above copyright notice, + this list of conditions and the following disclaimer in the documentation + and/or other materials provided with the distribution. + +* Neither the name of the copyright holder nor the names of its + contributors may be used to endorse or promote products derived from + this software without specific prior written permission. 
+ +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. - -About the Copyright Holders -=========================== - -AQR Capital Management began pandas development in 2008. Development was -led by Wes McKinney. AQR released the source under this license in 2009. -Wes is now an employee of Lambda Foundry, and remains the pandas project -lead. - -The PyData Development Team is the collection of developers of the PyData -project. This includes all of the PyData sub-projects, including pandas. The -core team that coordinates development on GitHub can be found here: -http://github.com/pydata. - -Full credits for pandas contributors can be found in the documentation. - -Our Copyright Policy -==================== - -PyData uses a shared copyright model. Each contributor maintains copyright -over their contributions to PyData. However, it is important to note that -these contributions are typically only changes to the repositories. Thus, -the PyData source code, in its entirety, is not the copyright of any single -person or institution. Instead, it is the collective copyright of the -entire PyData Development Team. If individual contributors want to maintain -a record of what changes/contributions they have specific copyright on, -they should indicate their copyright in the commit message of the change -when they commit the change to one of the PyData repositories. - -With this in mind, the following banner should be used in any source code -file to indicate the copyright and license terms: - -#----------------------------------------------------------------------------- -# Copyright (c) 2012, PyData Development Team -# All rights reserved. -# -# Distributed under the terms of the BSD Simplified License. -# -# The full license is in the LICENSE file, distributed with this software. -#----------------------------------------------------------------------------- - -Other licenses can be found in the LICENSES directory. \ No newline at end of file diff --git a/LICENSES/DATEUTIL_LICENSE b/LICENSES/DATEUTIL_LICENSE new file mode 100644 index 0000000000000..6053d35cfc60b --- /dev/null +++ b/LICENSES/DATEUTIL_LICENSE @@ -0,0 +1,54 @@ +Copyright 2017- Paul Ganssle +Copyright 2017- dateutil contributors (see AUTHORS file) + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. 
+ +The above license applies to all contributions after 2017-12-01, as well as +all contributions that have been re-licensed (see AUTHORS file for the list of +contributors who have re-licensed their code). +-------------------------------------------------------------------------------- +dateutil - Extensions to the standard Python datetime module. + +Copyright (c) 2003-2011 - Gustavo Niemeyer +Copyright (c) 2012-2014 - Tomi Pieviläinen +Copyright (c) 2014-2016 - Yaron de Leeuw +Copyright (c) 2015- - Paul Ganssle +Copyright (c) 2015- - dateutil contributors (see AUTHORS file) + +All rights reserved. + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright notice, + this list of conditions and the following disclaimer in the documentation + and/or other materials provided with the distribution. + * Neither the name of the copyright holder nor the names of its + contributors may be used to endorse or promote products derived from + this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS +"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT +LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR +A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR +CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, +EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, +PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR +PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF +LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING +NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS +SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + +The above BSD License Applies to all code, even that also covered by Apache 2.0. diff --git a/LICENSES/MUSL_LICENSE b/LICENSES/MUSL_LICENSE new file mode 100644 index 0000000000000..a8833d4bc4744 --- /dev/null +++ b/LICENSES/MUSL_LICENSE @@ -0,0 +1,132 @@ +musl as a whole is licensed under the following standard MIT license: + +---------------------------------------------------------------------- +Copyright © 2005-2014 Rich Felker, et al. + +Permission is hereby granted, free of charge, to any person obtaining +a copy of this software and associated documentation files (the +"Software"), to deal in the Software without restriction, including +without limitation the rights to use, copy, modify, merge, publish, +distribute, sublicense, and/or sell copies of the Software, and to +permit persons to whom the Software is furnished to do so, subject to +the following conditions: + +The above copyright notice and this permission notice shall be +included in all copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, +EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF +MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. +IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY +CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, +TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE +SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
+---------------------------------------------------------------------- + +Authors/contributors include: + +Anthony G. Basile +Arvid Picciani +Bobby Bingham +Boris Brezillon +Brent Cook +Chris Spiegel +Clément Vasseur +Emil Renner Berthing +Hiltjo Posthuma +Isaac Dunham +Jens Gustedt +Jeremy Huntwork +John Spencer +Justin Cormack +Luca Barbato +Luka Perkov +M Farkas-Dyck (Strake) +Michael Forney +Nicholas J. Kain +orc +Pascal Cuoq +Pierre Carrier +Rich Felker +Richard Pennington +sin +Solar Designer +Stefan Kristiansson +Szabolcs Nagy +Timo Teräs +Valentin Ochs +William Haddon + +Portions of this software are derived from third-party works licensed +under terms compatible with the above MIT license: + +The TRE regular expression implementation (src/regex/reg* and +src/regex/tre*) is Copyright © 2001-2008 Ville Laurikari and licensed +under a 2-clause BSD license (license text in the source files). The +included version has been heavily modified by Rich Felker in 2012, in +the interests of size, simplicity, and namespace cleanliness. + +Much of the math library code (src/math/* and src/complex/*) is +Copyright © 1993,2004 Sun Microsystems or +Copyright © 2003-2011 David Schultz or +Copyright © 2003-2009 Steven G. Kargl or +Copyright © 2003-2009 Bruce D. Evans or +Copyright © 2008 Stephen L. Moshier +and labelled as such in comments in the individual source files. All +have been licensed under extremely permissive terms. + +The ARM memcpy code (src/string/armel/memcpy.s) is Copyright © 2008 +The Android Open Source Project and is licensed under a two-clause BSD +license. It was taken from Bionic libc, used on Android. + +The implementation of DES for crypt (src/misc/crypt_des.c) is +Copyright © 1994 David Burren. It is licensed under a BSD license. + +The implementation of blowfish crypt (src/misc/crypt_blowfish.c) was +originally written by Solar Designer and placed into the public +domain. The code also comes with a fallback permissive license for use +in jurisdictions that may not recognize the public domain. + +The smoothsort implementation (src/stdlib/qsort.c) is Copyright © 2011 +Valentin Ochs and is licensed under an MIT-style license. + +The BSD PRNG implementation (src/prng/random.c) and XSI search API +(src/search/*.c) functions are Copyright © 2011 Szabolcs Nagy and +licensed under following terms: "Permission to use, copy, modify, +and/or distribute this code for any purpose with or without fee is +hereby granted. There is no warranty." + +The x86_64 port was written by Nicholas J. Kain. Several files (crt) +were released into the public domain; others are licensed under the +standard MIT license terms at the top of this file. See individual +files for their copyright status. + +The mips and microblaze ports were originally written by Richard +Pennington for use in the ellcc project. The original code was adapted +by Rich Felker for build system and code conventions during upstream +integration. It is licensed under the standard MIT terms. + +The powerpc port was also originally written by Richard Pennington, +and later supplemented and integrated by John Spencer. It is licensed +under the standard MIT terms. + +All other files which have no copyright comments are original works +produced specifically for use as part of this library, written either +by Rich Felker, the main author of the library, or by one or more +contibutors listed above. Details on authorship of individual files +can be found in the git version control history of the project. 
The +omission of copyright and license comments in each file is in the +interest of source tree size. + +All public header files (include/* and arch/*/bits/*) should be +treated as Public Domain as they intentionally contain no content +which can be covered by copyright. Some source modules may fall in +this category as well. If you believe that a file is so trivial that +it should be in the Public Domain, please contact the authors and +request an explicit statement releasing it from copyright. + +The following files are trivial, believed not to be copyrightable in +the first place, and hereby explicitly released to the Public Domain: + +All public headers: include/*, arch/*/bits/* +Startup files: crt/* diff --git a/LICENSES/XARRAY_LICENSE b/LICENSES/XARRAY_LICENSE new file mode 100644 index 0000000000000..37ec93a14fdcd --- /dev/null +++ b/LICENSES/XARRAY_LICENSE @@ -0,0 +1,191 @@ +Apache License +Version 2.0, January 2004 +http://www.apache.org/licenses/ + +TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + +1. Definitions. + +"License" shall mean the terms and conditions for use, reproduction, and +distribution as defined by Sections 1 through 9 of this document. + +"Licensor" shall mean the copyright owner or entity authorized by the copyright +owner that is granting the License. + +"Legal Entity" shall mean the union of the acting entity and all other entities +that control, are controlled by, or are under common control with that entity. +For the purposes of this definition, "control" means (i) the power, direct or +indirect, to cause the direction or management of such entity, whether by +contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the +outstanding shares, or (iii) beneficial ownership of such entity. + +"You" (or "Your") shall mean an individual or Legal Entity exercising +permissions granted by this License. + +"Source" form shall mean the preferred form for making modifications, including +but not limited to software source code, documentation source, and configuration +files. + +"Object" form shall mean any form resulting from mechanical transformation or +translation of a Source form, including but not limited to compiled object code, +generated documentation, and conversions to other media types. + +"Work" shall mean the work of authorship, whether in Source or Object form, made +available under the License, as indicated by a copyright notice that is included +in or attached to the work (an example is provided in the Appendix below). + +"Derivative Works" shall mean any work, whether in Source or Object form, that +is based on (or derived from) the Work and for which the editorial revisions, +annotations, elaborations, or other modifications represent, as a whole, an +original work of authorship. For the purposes of this License, Derivative Works +shall not include works that remain separable from, or merely link (or bind by +name) to the interfaces of, the Work and Derivative Works thereof. + +"Contribution" shall mean any work of authorship, including the original version +of the Work and any modifications or additions to that Work or Derivative Works +thereof, that is intentionally submitted to Licensor for inclusion in the Work +by the copyright owner or by an individual or Legal Entity authorized to submit +on behalf of the copyright owner. 
For the purposes of this definition, +"submitted" means any form of electronic, verbal, or written communication sent +to the Licensor or its representatives, including but not limited to +communication on electronic mailing lists, source code control systems, and +issue tracking systems that are managed by, or on behalf of, the Licensor for +the purpose of discussing and improving the Work, but excluding communication +that is conspicuously marked or otherwise designated in writing by the copyright +owner as "Not a Contribution." + +"Contributor" shall mean Licensor and any individual or Legal Entity on behalf +of whom a Contribution has been received by Licensor and subsequently +incorporated within the Work. + +2. Grant of Copyright License. + +Subject to the terms and conditions of this License, each Contributor hereby +grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, +irrevocable copyright license to reproduce, prepare Derivative Works of, +publicly display, publicly perform, sublicense, and distribute the Work and such +Derivative Works in Source or Object form. + +3. Grant of Patent License. + +Subject to the terms and conditions of this License, each Contributor hereby +grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, +irrevocable (except as stated in this section) patent license to make, have +made, use, offer to sell, sell, import, and otherwise transfer the Work, where +such license applies only to those patent claims licensable by such Contributor +that are necessarily infringed by their Contribution(s) alone or by combination +of their Contribution(s) with the Work to which such Contribution(s) was +submitted. If You institute patent litigation against any entity (including a +cross-claim or counterclaim in a lawsuit) alleging that the Work or a +Contribution incorporated within the Work constitutes direct or contributory +patent infringement, then any patent licenses granted to You under this License +for that Work shall terminate as of the date such litigation is filed. + +4. Redistribution. + +You may reproduce and distribute copies of the Work or Derivative Works thereof +in any medium, with or without modifications, and in Source or Object form, +provided that You meet the following conditions: + +You must give any other recipients of the Work or Derivative Works a copy of +this License; and +You must cause any modified files to carry prominent notices stating that You +changed the files; and +You must retain, in the Source form of any Derivative Works that You distribute, +all copyright, patent, trademark, and attribution notices from the Source form +of the Work, excluding those notices that do not pertain to any part of the +Derivative Works; and +If the Work includes a "NOTICE" text file as part of its distribution, then any +Derivative Works that You distribute must include a readable copy of the +attribution notices contained within such NOTICE file, excluding those notices +that do not pertain to any part of the Derivative Works, in at least one of the +following places: within a NOTICE text file distributed as part of the +Derivative Works; within the Source form or documentation, if provided along +with the Derivative Works; or, within a display generated by the Derivative +Works, if and wherever such third-party notices normally appear. The contents of +the NOTICE file are for informational purposes only and do not modify the +License. 
You may add Your own attribution notices within Derivative Works that +You distribute, alongside or as an addendum to the NOTICE text from the Work, +provided that such additional attribution notices cannot be construed as +modifying the License. +You may add Your own copyright statement to Your modifications and may provide +additional or different license terms and conditions for use, reproduction, or +distribution of Your modifications, or for any such Derivative Works as a whole, +provided Your use, reproduction, and distribution of the Work otherwise complies +with the conditions stated in this License. + +5. Submission of Contributions. + +Unless You explicitly state otherwise, any Contribution intentionally submitted +for inclusion in the Work by You to the Licensor shall be under the terms and +conditions of this License, without any additional terms or conditions. +Notwithstanding the above, nothing herein shall supersede or modify the terms of +any separate license agreement you may have executed with Licensor regarding +such Contributions. + +6. Trademarks. + +This License does not grant permission to use the trade names, trademarks, +service marks, or product names of the Licensor, except as required for +reasonable and customary use in describing the origin of the Work and +reproducing the content of the NOTICE file. + +7. Disclaimer of Warranty. + +Unless required by applicable law or agreed to in writing, Licensor provides the +Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, +including, without limitation, any warranties or conditions of TITLE, +NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are +solely responsible for determining the appropriateness of using or +redistributing the Work and assume any risks associated with Your exercise of +permissions under this License. + +8. Limitation of Liability. + +In no event and under no legal theory, whether in tort (including negligence), +contract, or otherwise, unless required by applicable law (such as deliberate +and grossly negligent acts) or agreed to in writing, shall any Contributor be +liable to You for damages, including any direct, indirect, special, incidental, +or consequential damages of any character arising as a result of this License or +out of the use or inability to use the Work (including but not limited to +damages for loss of goodwill, work stoppage, computer failure or malfunction, or +any and all other commercial damages or losses), even if such Contributor has +been advised of the possibility of such damages. + +9. Accepting Warranty or Additional Liability. + +While redistributing the Work or Derivative Works thereof, You may choose to +offer, and charge a fee for, acceptance of support, warranty, indemnity, or +other liability obligations and/or rights consistent with this License. However, +in accepting such obligations, You may act only on Your own behalf and on Your +sole responsibility, not on behalf of any other Contributor, and only if You +agree to indemnify, defend, and hold each Contributor harmless for any liability +incurred by, or claims asserted against, such Contributor by reason of your +accepting any such warranty or additional liability. 
+ +END OF TERMS AND CONDITIONS + +APPENDIX: How to apply the Apache License to your work + +To apply the Apache License to your work, attach the following boilerplate +notice, with the fields enclosed by brackets "[]" replaced with your own +identifying information. (Don't include the brackets!) The text should be +enclosed in the appropriate comment syntax for the file format. We also +recommend that a file or class name and description of purpose be included on +the same "printed page" as the copyright notice for easier identification within +third-party archives. + + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/MANIFEST.in b/MANIFEST.in index b7a7e6039ac9a..b417b8890fa24 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -1,27 +1,41 @@ include MANIFEST.in include LICENSE include RELEASE.md -include README.rst +include README.md include setup.py graft doc prune doc/build +graft LICENSES + graft pandas -global-exclude *.so -global-exclude *.pyd +global-exclude *.bz2 +global-exclude *.csv +global-exclude *.dta +global-exclude *.gz +global-exclude *.h5 +global-exclude *.html +global-exclude *.json +global-exclude *.msgpack +global-exclude *.pickle +global-exclude *.png global-exclude *.pyc +global-exclude *.pyd +global-exclude *.sas7bdat +global-exclude *.so +global-exclude *.xls +global-exclude *.xlsm +global-exclude *.xlsx +global-exclude *.xpt +global-exclude *.xz +global-exclude *.zip global-exclude *~ -global-exclude \#* -global-exclude .git* global-exclude .DS_Store -global-exclude *.png +global-exclude .git* +global-exclude \#* -# include examples/data/* -# recursive-include examples *.py -# recursive-include doc/source * -# recursive-include doc/sphinxext * -# recursive-include LICENSES * include versioneer.py include pandas/_version.py +include pandas/io/formats/templates/*.tpl diff --git a/Makefile b/Makefile index 194a8861715b7..956ff52338839 100644 --- a/Makefile +++ b/Makefile @@ -12,6 +12,9 @@ clean_pyc: build: clean_pyc python setup.py build_ext --inplace +lint-diff: + git diff upstream/master --name-only -- "*.py" | xargs flake8 + develop: build -python setup.py develop diff --git a/README.md b/README.md index e05f1405419fc..ce22818705865 100644 --- a/README.md +++ b/README.md @@ -9,18 +9,33 @@ - + - + - + + - + @@ -33,52 +48,40 @@ - - - - - - - - - - + - - + +
[README.md badge table — the HTML table markup was lost in extraction; only the badge labels remain recoverable. Rows: "Latest Release" (latest-release badges), "Package Status" (status badge), "License" (license badge), "Build Status" (the CircleCI and AppVeyor build-status badges are removed and an Azure Pipelines build-status badge is added), "Coverage" (coverage badge), "Conda" (the conda default-downloads badge is removed), "Conda-forge"/"Downloads" (conda-forge downloads badge), "PyPI" (pypi downloads badge), and "Gitter".]
-[![https://gitter.im/pydata/pandas](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/pydata/pandas?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge) -## What is it + +## What is it? **pandas** is a Python package providing fast, flexible, and expressive data structures designed to make working with "relational" or "labeled" data both @@ -86,7 +89,7 @@ easy and intuitive. It aims to be the fundamental high-level building block for doing practical, **real world** data analysis in Python. Additionally, it has the broader goal of becoming **the most powerful and flexible open source data analysis / manipulation tool available in any language**. It is already well on -its way toward this goal. +its way towards this goal. ## Main Features Here are just a few of the things that pandas does well: @@ -123,31 +126,31 @@ Here are just a few of the things that pandas does well: moving window linear regressions, date shifting and lagging, etc. - [missing-data]: http://pandas.pydata.org/pandas-docs/stable/missing_data.html#working-with-missing-data - [insertion-deletion]: http://pandas.pydata.org/pandas-docs/stable/dsintro.html#column-selection-addition-deletion - [alignment]: http://pandas.pydata.org/pandas-docs/stable/dsintro.html?highlight=alignment#intro-to-data-structures - [groupby]: http://pandas.pydata.org/pandas-docs/stable/groupby.html#group-by-split-apply-combine - [conversion]: http://pandas.pydata.org/pandas-docs/stable/dsintro.html#dataframe - [slicing]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#slicing-ranges - [fancy-indexing]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#advanced-indexing-with-ix - [subsetting]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#boolean-indexing - [merging]: http://pandas.pydata.org/pandas-docs/stable/merging.html#database-style-dataframe-joining-merging - [joining]: http://pandas.pydata.org/pandas-docs/stable/merging.html#joining-on-index - [reshape]: http://pandas.pydata.org/pandas-docs/stable/reshaping.html#reshaping-and-pivot-tables - [pivot-table]: http://pandas.pydata.org/pandas-docs/stable/reshaping.html#pivot-tables-and-cross-tabulations - [mi]: http://pandas.pydata.org/pandas-docs/stable/indexing.html#hierarchical-indexing-multiindex - [flat-files]: http://pandas.pydata.org/pandas-docs/stable/io.html#csv-text-files - [excel]: http://pandas.pydata.org/pandas-docs/stable/io.html#excel-files - [db]: http://pandas.pydata.org/pandas-docs/stable/io.html#sql-queries - [hdfstore]: http://pandas.pydata.org/pandas-docs/stable/io.html#hdf5-pytables - [timeseries]: http://pandas.pydata.org/pandas-docs/stable/timeseries.html#time-series-date-functionality + [missing-data]: https://pandas.pydata.org/pandas-docs/stable/missing_data.html#working-with-missing-data + [insertion-deletion]: https://pandas.pydata.org/pandas-docs/stable/dsintro.html#column-selection-addition-deletion + [alignment]: https://pandas.pydata.org/pandas-docs/stable/dsintro.html?highlight=alignment#intro-to-data-structures + [groupby]: https://pandas.pydata.org/pandas-docs/stable/groupby.html#group-by-split-apply-combine + [conversion]: https://pandas.pydata.org/pandas-docs/stable/dsintro.html#dataframe + [slicing]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#slicing-ranges + [fancy-indexing]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#advanced-indexing-with-ix + [subsetting]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#boolean-indexing + [merging]: 
https://pandas.pydata.org/pandas-docs/stable/merging.html#database-style-dataframe-joining-merging + [joining]: https://pandas.pydata.org/pandas-docs/stable/merging.html#joining-on-index + [reshape]: https://pandas.pydata.org/pandas-docs/stable/reshaping.html#reshaping-and-pivot-tables + [pivot-table]: https://pandas.pydata.org/pandas-docs/stable/reshaping.html#pivot-tables-and-cross-tabulations + [mi]: https://pandas.pydata.org/pandas-docs/stable/indexing.html#hierarchical-indexing-multiindex + [flat-files]: https://pandas.pydata.org/pandas-docs/stable/io.html#csv-text-files + [excel]: https://pandas.pydata.org/pandas-docs/stable/io.html#excel-files + [db]: https://pandas.pydata.org/pandas-docs/stable/io.html#sql-queries + [hdfstore]: https://pandas.pydata.org/pandas-docs/stable/io.html#hdf5-pytables + [timeseries]: https://pandas.pydata.org/pandas-docs/stable/timeseries.html#time-series-date-functionality ## Where to get it The source code is currently hosted on GitHub at: -http://github.com/pandas-dev/pandas +https://github.com/pandas-dev/pandas Binary installers for the latest released version are available at the [Python -package index](http://pypi.python.org/pypi/pandas/) and on conda. +package index](https://pypi.org/project/pandas) and on conda. ```sh # conda @@ -160,12 +163,11 @@ pip install pandas ``` ## Dependencies -- [NumPy](http://www.numpy.org): 1.7.0 or higher -- [python-dateutil](http://labix.org/python-dateutil): 1.5 or higher -- [pytz](http://pytz.sourceforge.net) - - Needed for time zone support with ``pandas.date_range`` +- [NumPy](https://www.numpy.org): 1.12.0 or higher +- [python-dateutil](https://labix.org/python-dateutil): 2.5.0 or higher +- [pytz](https://pythonhosted.org/pytz): 2011k or higher -See the [full installation instructions](http://pandas.pydata.org/pandas-docs/stable/install.html#dependencies) +See the [full installation instructions](https://pandas.pydata.org/pandas-docs/stable/install.html#dependencies) for recommended and optional dependencies. ## Installation from sources @@ -197,32 +199,36 @@ mode](https://pip.pypa.io/en/latest/reference/pip_install.html#editable-installs pip install -e . ``` -On Windows, you will need to install MinGW and execute: - -```sh -python setup.py build --compiler=mingw32 -python setup.py install -``` - -See http://pandas.pydata.org/ for more information. +See the full instructions for [installing from source](https://pandas.pydata.org/pandas-docs/stable/install.html#installing-from-source). ## License -BSD +[BSD 3](LICENSE) ## Documentation -The official documentation is hosted on PyData.org: http://pandas.pydata.org/ - -The Sphinx documentation should provide a good starting point for learning how -to use the library. Expect the docs to continue to expand as time goes on. +The official documentation is hosted on PyData.org: https://pandas.pydata.org/pandas-docs/stable ## Background Work on ``pandas`` started at AQR (a quantitative hedge fund) in 2008 and has been under active development since then. +## Getting Help + +For usage questions, the best place to go to is [StackOverflow](https://stackoverflow.com/questions/tagged/pandas). +Further, general questions and discussions can also take place on the [pydata mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata). + ## Discussion and Development -Since pandas development is related to a number of other scientific -Python projects, questions are welcome on the scipy-user mailing -list. 
Specialized discussions or design issues should take place on -the PyData mailing list / Google group: +Most development discussion is taking place on github in this repo. Further, the [pandas-dev mailing list](https://mail.python.org/mailman/listinfo/pandas-dev) can also be used for specialized discussions or design issues, and a [Gitter channel](https://gitter.im/pydata/pandas) is available for quick development related questions. + +## Contributing to pandas [![Open Source Helpers](https://www.codetriage.com/pandas-dev/pandas/badges/users.svg)](https://www.codetriage.com/pandas-dev/pandas) + +All contributions, bug reports, bug fixes, documentation improvements, enhancements and ideas are welcome. + +A detailed overview on how to contribute can be found in the **[contributing guide](https://pandas-docs.github.io/pandas-docs-travis/contributing.html)**. There is also an [overview](.github/CONTRIBUTING.md) on GitHub. + +If you are simply looking to start working with the pandas codebase, navigate to the [GitHub "issues" tab](https://github.com/pandas-dev/pandas/issues) and start looking through interesting issues. There are a number of issues listed under [Docs](https://github.com/pandas-dev/pandas/issues?labels=Docs&sort=updated&state=open) and [good first issue](https://github.com/pandas-dev/pandas/issues?labels=good+first+issue&sort=updated&state=open) where you could start out. + +You can also triage issues which may include reproducing bug reports, or asking for vital information such as version numbers or reproduction instructions. If you would like to start triaging issues, one easy way to get started is to [subscribe to pandas on CodeTriage](https://www.codetriage.com/pandas-dev/pandas). + +Or maybe through using pandas you have an idea of your own or are looking for something in the documentation and thinking ‘this can be improved’...you can do something about it! -https://groups.google.com/forum/#!forum/pydata +Feel free to ask questions on the [mailing list](https://groups.google.com/forum/?fromgroups#!forum/pydata) or on [Gitter](https://gitter.im/pydata/pandas). diff --git a/appveyor.yml b/appveyor.yml deleted file mode 100644 index db729b3005be6..0000000000000 --- a/appveyor.yml +++ /dev/null @@ -1,89 +0,0 @@ -# With infos from -# http://tjelvarolsson.com/blog/how-to-continuously-test-your-python-code-on-windows-using-appveyor/ -# https://packaging.python.org/en/latest/appveyor/ -# https://github.com/rmcgibbo/python-appveyor-conda-example - -# Backslashes in quotes need to be escaped: \ -> "\\" - -matrix: - fast_finish: true # immediately finish build once one of the jobs fails. - -environment: - global: - # SDK v7.0 MSVC Express 2008's SetEnv.cmd script will fail if the - # /E:ON and /V:ON options are not enabled in the batch script intepreter - # See: http://stackoverflow.com/a/13751649/163740 - CMD_IN_ENV: "cmd /E:ON /V:ON /C .\\ci\\run_with_env.cmd" - clone_folder: C:\projects\pandas - - matrix: - - - CONDA_ROOT: "C:\\Miniconda3_64" - PYTHON_VERSION: "3.6" - PYTHON_ARCH: "64" - CONDA_PY: "36" - CONDA_NPY: "112" - - - CONDA_ROOT: "C:\\Miniconda3_64" - PYTHON_VERSION: "2.7" - PYTHON_ARCH: "64" - CONDA_PY: "27" - CONDA_NPY: "110" - -# We always use a 64-bit machine, but can build x86 distributions -# with the PYTHON_ARCH variable (which is used by CMD_IN_ENV). -platform: - - x64 - -# all our python builds have to happen in tests_script... 
-build: false - -install: - # cancel older builds for the same PR - - ps: if ($env:APPVEYOR_PULL_REQUEST_NUMBER -and $env:APPVEYOR_BUILD_NUMBER -ne ((Invoke-RestMethod ` - https://ci.appveyor.com/api/projects/$env:APPVEYOR_ACCOUNT_NAME/$env:APPVEYOR_PROJECT_SLUG/history?recordsNumber=50).builds | ` - Where-Object pullRequestId -eq $env:APPVEYOR_PULL_REQUEST_NUMBER)[0].buildNumber) { ` - throw "There are newer queued builds for this pull request, failing early." } - - # this installs the appropriate Miniconda (Py2/Py3, 32/64 bit) - # updates conda & installs: conda-build jinja2 anaconda-client - - powershell .\ci\install.ps1 - - SET PATH=%CONDA_ROOT%;%CONDA_ROOT%\Scripts;%PATH% - - echo "install" - - cd - - ls -ltr - - git tag --sort v:refname - - # this can conflict with git - - cmd: rmdir C:\cygwin /s /q - - # install our build environment - - cmd: conda config --set show_channel_urls true --set always_yes true --set changeps1 false - - cmd: conda update -q conda - - cmd: conda config --set ssl_verify false - - # add the pandas channel *before* defaults to have defaults take priority - - cmd: conda config --add channels conda-forge - - cmd: conda config --add channels pandas - - cmd: conda config --remove channels defaults - - cmd: conda config --add channels defaults - - # this is now the downloaded conda... - - cmd: conda info -a - - # create our env - - cmd: conda create -n pandas python=%PYTHON_VERSION% cython pytest - - cmd: activate pandas - - SET REQ=ci\requirements-%PYTHON_VERSION%_WIN.run - - cmd: echo "installing requirements from %REQ%" - - cmd: conda install -n pandas --file=%REQ% - - cmd: conda list -n pandas - - cmd: echo "installing requirements from %REQ% - done" - - # build em using the local source checkout in the correct windows env - - cmd: '%CMD_IN_ENV% python setup.py build_ext --inplace' - -test_script: - # tests - - cmd: activate pandas - - cmd: test.bat diff --git a/asv_bench/asv.conf.json b/asv_bench/asv.conf.json index 4fc6f9f634426..fa098e2455683 100644 --- a/asv_bench/asv.conf.json +++ b/asv_bench/asv.conf.json @@ -26,7 +26,7 @@ // The Pythons you'd like to test against. If not provided, defaults // to the current version of Python used to run `asv`. // "pythons": ["2.7", "3.4"], - "pythons": ["2.7"], + "pythons": ["3.6"], // The matrix of dependencies to test. Each key is the name of a // package (in PyPI) and the values are version numbers. An empty @@ -46,12 +46,14 @@ "numexpr": [], "pytables": [null, ""], // platform dependent, see excludes below "tables": [null, ""], - "libpython": [null, ""], "openpyxl": [], "xlsxwriter": [], "xlrd": [], "xlwt": [], "pytest": [], + // If using Windows with python 2.7 and want to build using the + // mingw toolchain (rather than MSVC), uncomment the following line. + // "libpython": [], }, // Combinations of libraries/python versions can be excluded/included @@ -80,10 +82,6 @@ {"environment_type": "conda", "pytables": null}, {"environment_type": "(?!conda).*", "tables": null}, {"environment_type": "(?!conda).*", "pytables": ""}, - // On conda&win32, install libpython - {"sys_platform": "(?!win32).*", "libpython": ""}, - {"environment_type": "conda", "sys_platform": "win32", "libpython": null}, - {"environment_type": "(?!conda).*", "libpython": ""} ], "include": [], @@ -119,8 +117,9 @@ // with results. If the commit is `null`, regression detection is // skipped for the matching benchmark. 
// - // "regressions_first_commits": { - // "some_benchmark": "352cdf", // Consider regressions only after this commit - // "another_benchmark": null, // Skip regression detection altogether - // } + "regressions_first_commits": { + ".*": "0409521665" + }, + "regression_thresholds": { + } } diff --git a/asv_bench/benchmarks/__init__.py b/asv_bench/benchmarks/__init__.py index e69de29bb2d1d..eada147852fe1 100644 --- a/asv_bench/benchmarks/__init__.py +++ b/asv_bench/benchmarks/__init__.py @@ -0,0 +1 @@ +"""Pandas benchmarks.""" diff --git a/asv_bench/benchmarks/algorithms.py b/asv_bench/benchmarks/algorithms.py index fe657936c403e..74849d330f2bc 100644 --- a/asv_bench/benchmarks/algorithms.py +++ b/asv_bench/benchmarks/algorithms.py @@ -1,115 +1,144 @@ +from importlib import import_module + import numpy as np + import pandas as pd from pandas.util import testing as tm +for imp in ['pandas.util', 'pandas.tools.hashing']: + try: + hashing = import_module(imp) + break + except (ImportError, TypeError, ValueError): + pass + + +class Factorize(object): + + params = [[True, False], ['int', 'uint', 'float', 'string']] + param_names = ['sort', 'dtype'] + + def setup(self, sort, dtype): + N = 10**5 + data = {'int': pd.Int64Index(np.arange(N).repeat(5)), + 'uint': pd.UInt64Index(np.arange(N).repeat(5)), + 'float': pd.Float64Index(np.random.randn(N).repeat(5)), + 'string': tm.makeStringIndex(N).repeat(5)} + self.idx = data[dtype] + + def time_factorize(self, sort, dtype): + self.idx.factorize(sort=sort) + -class Algorithms(object): - goal_time = 0.2 +class FactorizeUnique(object): - def setup(self): - N = 100000 - np.random.seed(1234) + params = [[True, False], ['int', 'uint', 'float', 'string']] + param_names = ['sort', 'dtype'] - self.int_unique = pd.Int64Index(np.arange(N * 5)) + def setup(self, sort, dtype): + N = 10**5 + data = {'int': pd.Int64Index(np.arange(N)), + 'uint': pd.UInt64Index(np.arange(N)), + 'float': pd.Float64Index(np.arange(N)), + 'string': tm.makeStringIndex(N)} + self.idx = data[dtype] + assert self.idx.is_unique + + def time_factorize(self, sort, dtype): + self.idx.factorize(sort=sort) + + +class Duplicated(object): + + params = [['first', 'last', False], ['int', 'uint', 'float', 'string']] + param_names = ['keep', 'dtype'] + + def setup(self, keep, dtype): + N = 10**5 + data = {'int': pd.Int64Index(np.arange(N).repeat(5)), + 'uint': pd.UInt64Index(np.arange(N).repeat(5)), + 'float': pd.Float64Index(np.random.randn(N).repeat(5)), + 'string': tm.makeStringIndex(N).repeat(5)} + self.idx = data[dtype] # cache is_unique - self.int_unique.is_unique + self.idx.is_unique - self.int = pd.Int64Index(np.arange(N).repeat(5)) - self.float = pd.Float64Index(np.random.randn(N).repeat(5)) + def time_duplicated(self, keep, dtype): + self.idx.duplicated(keep=keep) - # Convenience naming. 
- self.checked_add = pd.core.algorithms.checked_add_with_arr - self.arr = np.arange(1000000) - self.arrpos = np.arange(1000000) - self.arrneg = np.arange(-1000000, 0) - self.arrmixed = np.array([1, -1]).repeat(500000) - self.strings = tm.makeStringIndex(100000) +class DuplicatedUniqueIndex(object): - self.arr_nan = np.random.choice([True, False], size=1000000) - self.arrmixed_nan = np.random.choice([True, False], size=1000000) + params = ['int', 'uint', 'float', 'string'] + param_names = ['dtype'] - # match - self.uniques = tm.makeStringIndex(1000).values - self.all = self.uniques.repeat(10) + def setup(self, dtype): + N = 10**5 + data = {'int': pd.Int64Index(np.arange(N)), + 'uint': pd.UInt64Index(np.arange(N)), + 'float': pd.Float64Index(np.random.randn(N)), + 'string': tm.makeStringIndex(N)} + self.idx = data[dtype] + # cache is_unique + self.idx.is_unique - def time_factorize_string(self): - self.strings.factorize() + def time_duplicated_unique(self, dtype): + self.idx.duplicated() - def time_factorize_int(self): - self.int.factorize() - def time_factorize_float(self): - self.int.factorize() +class Hashing(object): - def time_duplicated_int_unique(self): - self.int_unique.duplicated() + def setup_cache(self): + N = 10**5 - def time_duplicated_int(self): - self.int.duplicated() + df = pd.DataFrame( + {'strings': pd.Series(tm.makeStringIndex(10000).take( + np.random.randint(0, 10000, size=N))), + 'floats': np.random.randn(N), + 'ints': np.arange(N), + 'dates': pd.date_range('20110101', freq='s', periods=N), + 'timedeltas': pd.timedelta_range('1 day', freq='s', periods=N)}) + df['categories'] = df['strings'].astype('category') + df.iloc[10:20] = np.nan + return df - def time_duplicated_float(self): - self.float.duplicated() + def time_frame(self, df): + hashing.hash_pandas_object(df) - def time_match_strings(self): - pd.match(self.all, self.uniques) + def time_series_int(self, df): + hashing.hash_pandas_object(df['ints']) - def time_add_overflow_pos_scalar(self): - self.checked_add(self.arr, 1) + def time_series_string(self, df): + hashing.hash_pandas_object(df['strings']) - def time_add_overflow_neg_scalar(self): - self.checked_add(self.arr, -1) + def time_series_float(self, df): + hashing.hash_pandas_object(df['floats']) - def time_add_overflow_zero_scalar(self): - self.checked_add(self.arr, 0) + def time_series_categorical(self, df): + hashing.hash_pandas_object(df['categories']) - def time_add_overflow_pos_arr(self): - self.checked_add(self.arr, self.arrpos) + def time_series_timedeltas(self, df): + hashing.hash_pandas_object(df['timedeltas']) - def time_add_overflow_neg_arr(self): - self.checked_add(self.arr, self.arrneg) + def time_series_dates(self, df): + hashing.hash_pandas_object(df['dates']) - def time_add_overflow_mixed_arr(self): - self.checked_add(self.arr, self.arrmixed) - def time_add_overflow_first_arg_nan(self): - self.checked_add(self.arr, self.arrmixed, arr_mask=self.arr_nan) +class Quantile(object): + params = [[0, 0.5, 1], + ['linear', 'nearest', 'lower', 'higher', 'midpoint'], + ['float', 'int', 'uint']] + param_names = ['quantile', 'interpolation', 'dtype'] - def time_add_overflow_second_arg_nan(self): - self.checked_add(self.arr, self.arrmixed, b_mask=self.arrmixed_nan) + def setup(self, quantile, interpolation, dtype): + N = 10**5 + data = {'int': np.arange(N), + 'uint': np.arange(N).astype(np.uint64), + 'float': np.random.randn(N)} + self.idx = pd.Series(data[dtype].repeat(5)) - def time_add_overflow_both_arg_nan(self): - self.checked_add(self.arr, 
self.arrmixed, arr_mask=self.arr_nan, - b_mask=self.arrmixed_nan) + def time_quantile(self, quantile, interpolation, dtype): + self.idx.quantile(quantile, interpolation=interpolation) -class Hashing(object): - goal_time = 0.2 - - def setup(self): - N = 100000 - - self.df = pd.DataFrame( - {'A': pd.Series(tm.makeStringIndex(100).take( - np.random.randint(0, 100, size=N))), - 'B': pd.Series(tm.makeStringIndex(10000).take( - np.random.randint(0, 10000, size=N))), - 'D': np.random.randn(N), - 'E': np.arange(N), - 'F': pd.date_range('20110101', freq='s', periods=N), - 'G': pd.timedelta_range('1 day', freq='s', periods=N), - }) - self.df['C'] = self.df['B'].astype('category') - self.df.iloc[10:20] = np.nan - - def time_frame(self): - self.df.hash() - - def time_series_int(self): - self.df.E.hash() - - def time_series_string(self): - self.df.B.hash() - - def time_series_categorical(self): - self.df.C.hash() +from .pandas_vb_common import setup # noqa: F401 isort:skip diff --git a/asv_bench/benchmarks/attrs_caching.py b/asv_bench/benchmarks/attrs_caching.py index 9210f1f2878d4..d061755208c9e 100644 --- a/asv_bench/benchmarks/attrs_caching.py +++ b/asv_bench/benchmarks/attrs_caching.py @@ -1,9 +1,12 @@ -from .pandas_vb_common import * -from pandas.util.decorators import cache_readonly +import numpy as np +from pandas import DataFrame +try: + from pandas.util import cache_readonly +except ImportError: + from pandas.util.decorators import cache_readonly class DataFrameAttributes(object): - goal_time = 0.2 def setup(self): self.df = DataFrame(np.random.randn(10, 6)) @@ -17,7 +20,6 @@ def time_set_index(self): class CacheReadonly(object): - goal_time = 0.2 def setup(self): @@ -30,3 +32,6 @@ def prop(self): def time_cache_readonly(self): self.obj.prop + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/binary_ops.py b/asv_bench/benchmarks/binary_ops.py index 72700c3de282e..22b8ed80f3d07 100644 --- a/asv_bench/benchmarks/binary_ops.py +++ b/asv_bench/benchmarks/binary_ops.py @@ -1,9 +1,13 @@ -from .pandas_vb_common import * -import pandas.computation.expressions as expr +import numpy as np +from pandas import DataFrame, Series, date_range +from pandas.core.algorithms import checked_add_with_arr +try: + import pandas.core.computation.expressions as expr +except ImportError: + import pandas.computation.expressions as expr class Ops(object): - goal_time = 0.2 params = [[True, False], ['default', 1]] param_names = ['use_numexpr', 'threads'] @@ -17,18 +21,17 @@ def setup(self, use_numexpr, threads): if not use_numexpr: expr.set_use_numexpr(False) - def time_frame_add(self, use_numexpr, threads): - (self.df + self.df2) + self.df + self.df2 def time_frame_mult(self, use_numexpr, threads): - (self.df * self.df2) + self.df * self.df2 def time_frame_multi_and(self, use_numexpr, threads): - self.df[((self.df > 0) & (self.df2 > 0))] + self.df[(self.df > 0) & (self.df2 > 0)] def time_frame_comparison(self, use_numexpr, threads): - (self.df > self.df2) + self.df > self.df2 def teardown(self, use_numexpr, threads): expr.set_use_numexpr(True) @@ -36,75 +39,117 @@ def teardown(self, use_numexpr, threads): class Ops2(object): - goal_time = 0.2 def setup(self): - self.df = DataFrame(np.random.randn(1000, 1000)) - self.df2 = DataFrame(np.random.randn(1000, 1000)) + N = 10**3 + self.df = DataFrame(np.random.randn(N, N)) + self.df2 = DataFrame(np.random.randn(N, N)) + + self.df_int = DataFrame(np.random.randint(np.iinfo(np.int16).min, + np.iinfo(np.int16).max, + size=(N, N))) + self.df2_int 
= DataFrame(np.random.randint(np.iinfo(np.int16).min, + np.iinfo(np.int16).max, + size=(N, N))) - self.df_int = DataFrame( - np.random.random_integers(np.iinfo(np.int16).min, - np.iinfo(np.int16).max, - size=(1000, 1000))) - self.df2_int = DataFrame( - np.random.random_integers(np.iinfo(np.int16).min, - np.iinfo(np.int16).max, - size=(1000, 1000))) + self.s = Series(np.random.randn(N)) - ## Division + # Division def time_frame_float_div(self): - (self.df // self.df2) + self.df // self.df2 def time_frame_float_div_by_zero(self): - (self.df / 0) + self.df / 0 def time_frame_float_floor_by_zero(self): - (self.df // 0) + self.df // 0 def time_frame_int_div_by_zero(self): - (self.df_int / 0) + self.df_int / 0 - ## Modulo + # Modulo def time_frame_int_mod(self): - (self.df / self.df2) + self.df_int % self.df2_int def time_frame_float_mod(self): - (self.df / self.df2) + self.df % self.df2 + + # Dot product + + def time_frame_dot(self): + self.df.dot(self.df2) + + def time_series_dot(self): + self.s.dot(self.s) + + def time_frame_series_dot(self): + self.df.dot(self.s) class Timeseries(object): - goal_time = 0.2 - def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.s = Series(date_range('20010101', periods=self.N, freq='T')) - self.ts = self.s[self.halfway] + params = [None, 'US/Eastern'] + param_names = ['tz'] - self.s2 = Series(date_range('20010101', periods=self.N, freq='s')) + def setup(self, tz): + N = 10**6 + halfway = (N // 2) - 1 + self.s = Series(date_range('20010101', periods=N, freq='T', tz=tz)) + self.ts = self.s[halfway] - def time_series_timestamp_compare(self): - (self.s <= self.ts) + self.s2 = Series(date_range('20010101', periods=N, freq='s', tz=tz)) - def time_timestamp_series_compare(self): - (self.ts >= self.s) + def time_series_timestamp_compare(self, tz): + self.s <= self.ts - def time_timestamp_ops_diff1(self): + def time_timestamp_series_compare(self, tz): + self.ts >= self.s + + def time_timestamp_ops_diff(self, tz): self.s2.diff() - def time_timestamp_ops_diff2(self): - (self.s - self.s.shift()) + def time_timestamp_ops_diff_with_shift(self, tz): + self.s - self.s.shift() + +class AddOverflowScalar(object): + params = [1, -1, 0] + param_names = ['scalar'] -class TimeseriesTZ(Timeseries): + def setup(self, scalar): + N = 10**6 + self.arr = np.arange(N) + + def time_add_overflow_scalar(self, scalar): + checked_add_with_arr(self.arr, scalar) + + +class AddOverflowArray(object): def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.s = Series(date_range('20010101', periods=self.N, freq='T', tz='US/Eastern')) - self.ts = self.s[self.halfway] + N = 10**6 + self.arr = np.arange(N) + self.arr_rev = np.arange(-N, 0) + self.arr_mixed = np.array([1, -1]).repeat(N / 2) + self.arr_nan_1 = np.random.choice([True, False], size=N) + self.arr_nan_2 = np.random.choice([True, False], size=N) + + def time_add_overflow_arr_rev(self): + checked_add_with_arr(self.arr, self.arr_rev) + + def time_add_overflow_arr_mask_nan(self): + checked_add_with_arr(self.arr, self.arr_mixed, arr_mask=self.arr_nan_1) + + def time_add_overflow_b_mask_nan(self): + checked_add_with_arr(self.arr, self.arr_mixed, + b_mask=self.arr_nan_1) + + def time_add_overflow_both_arg_nan(self): + checked_add_with_arr(self.arr, self.arr_mixed, arr_mask=self.arr_nan_1, + b_mask=self.arr_nan_2) + - self.s2 = Series(date_range('20010101', periods=self.N, freq='s', tz='US/Eastern')) +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/categoricals.py 
b/asv_bench/benchmarks/categoricals.py index 153107911ca2c..4b5b2848f7e0f 100644 --- a/asv_bench/benchmarks/categoricals.py +++ b/asv_bench/benchmarks/categoricals.py @@ -1,99 +1,296 @@ -from .pandas_vb_common import * +import warnings + +import numpy as np +import pandas as pd +import pandas.util.testing as tm try: - from pandas.types.concat import union_categoricals + from pandas.api.types import union_categoricals except ImportError: - pass + try: + from pandas.types.concat import union_categoricals + except ImportError: + pass -class Categoricals(object): - goal_time = 0.2 +class Concat(object): def setup(self): - N = 100000 - self.s = pd.Series((list('aabbcd') * N)).astype('category') + N = 10**5 + self.s = pd.Series(list('aabbcd') * N).astype('category') + + self.a = pd.Categorical(list('aabbcd') * N) + self.b = pd.Categorical(list('bbcdjk') * N) + + def time_concat(self): + pd.concat([self.s, self.s]) + + def time_union(self): + union_categoricals([self.a, self.b]) + - self.a = pd.Categorical((list('aabbcd') * N)) - self.b = pd.Categorical((list('bbcdjk') * N)) +class Constructor(object): + def setup(self): + N = 10**5 self.categories = list('abcde') - self.cat_idx = Index(self.categories) + self.cat_idx = pd.Index(self.categories) self.values = np.tile(self.categories, N) self.codes = np.tile(range(len(self.categories)), N) - self.datetimes = pd.Series(pd.date_range( - '1995-01-01 00:00:00', periods=10000, freq='s')) + self.datetimes = pd.Series(pd.date_range('1995-01-01 00:00:00', + periods=N / 10, + freq='s')) + self.datetimes_with_nat = self.datetimes.copy() + self.datetimes_with_nat.iloc[-1] = pd.NaT - def time_concat(self): - concat([self.s, self.s]) + self.values_some_nan = list(np.tile(self.categories + [np.nan], N)) + self.values_all_nan = [np.nan] * len(self.values) + self.values_all_int8 = np.ones(N, 'int8') + self.categorical = pd.Categorical(self.values, self.categories) + self.series = pd.Series(self.categorical) - def time_union(self): - union_categoricals([self.a, self.b]) + def time_regular(self): + pd.Categorical(self.values, self.categories) - def time_constructor_regular(self): - Categorical(self.values, self.categories) + def time_fastpath(self): + pd.Categorical(self.codes, self.cat_idx, fastpath=True) - def time_constructor_fastpath(self): - Categorical(self.codes, self.cat_idx, fastpath=True) + def time_datetimes(self): + pd.Categorical(self.datetimes) - def time_constructor_datetimes(self): - Categorical(self.datetimes) + def time_datetimes_with_nat(self): + pd.Categorical(self.datetimes_with_nat) - def time_constructor_datetimes_with_nat(self): - t = self.datetimes - t.iloc[-1] = pd.NaT - Categorical(t) + def time_with_nan(self): + pd.Categorical(self.values_some_nan) + def time_all_nan(self): + pd.Categorical(self.values_all_nan) -class Categoricals2(object): - goal_time = 0.2 + def time_from_codes_all_int8(self): + pd.Categorical.from_codes(self.values_all_int8, self.categories) + + def time_existing_categorical(self): + pd.Categorical(self.categorical) + + def time_existing_series(self): + pd.Categorical(self.series) - def setup(self): - n = 500000 - np.random.seed(2718281) - arr = ['s%04d' % i for i in np.random.randint(0, n // 10, size=n)] - self.ts = Series(arr).astype('category') - self.sel = self.ts.loc[[0]] +class ValueCounts(object): - def time_value_counts(self): - self.ts.value_counts(dropna=False) + params = [True, False] + param_names = ['dropna'] - def time_value_counts_dropna(self): - self.ts.value_counts(dropna=True) + def setup(self, 
dropna): + n = 5 * 10**5 + arr = ['s{:04d}'.format(i) for i in np.random.randint(0, n // 10, + size=n)] + self.ts = pd.Series(arr).astype('category') + + def time_value_counts(self, dropna): + self.ts.value_counts(dropna=dropna) + + +class Repr(object): + + def setup(self): + self.sel = pd.Series(['s1234']).astype('category') def time_rendering(self): str(self.sel) -class Categoricals3(object): - goal_time = 0.2 +class SetCategories(object): + + def setup(self): + n = 5 * 10**5 + arr = ['s{:04d}'.format(i) for i in np.random.randint(0, n // 10, + size=n)] + self.ts = pd.Series(arr).astype('category') + + def time_set_categories(self): + self.ts.cat.set_categories(self.ts.cat.categories[::2]) + + +class RemoveCategories(object): + + def setup(self): + n = 5 * 10**5 + arr = ['s{:04d}'.format(i) for i in np.random.randint(0, n // 10, + size=n)] + self.ts = pd.Series(arr).astype('category') + + def time_remove_categories(self): + self.ts.cat.remove_categories(self.ts.cat.categories[::2]) + + +class Rank(object): def setup(self): - N = 100000 + N = 10**5 ncats = 100 - self.s1 = Series(np.array(tm.makeCategoricalIndex(N, ncats))) - self.s1_cat = self.s1.astype('category') - self.s1_cat_ordered = self.s1.astype('category', ordered=True) + self.s_str = pd.Series(tm.makeCategoricalIndex(N, ncats)).astype(str) + self.s_str_cat = self.s_str.astype('category') + with warnings.catch_warnings(record=True): + self.s_str_cat_ordered = self.s_str.astype('category', + ordered=True) - self.s2 = Series(np.random.randint(0, ncats, size=N)) - self.s2_cat = self.s2.astype('category') - self.s2_cat_ordered = self.s2.astype('category', ordered=True) + self.s_int = pd.Series(np.random.randint(0, ncats, size=N)) + self.s_int_cat = self.s_int.astype('category') + with warnings.catch_warnings(record=True): + self.s_int_cat_ordered = self.s_int.astype('category', + ordered=True) def time_rank_string(self): - self.s1.rank() + self.s_str.rank() def time_rank_string_cat(self): - self.s1_cat.rank() + self.s_str_cat.rank() def time_rank_string_cat_ordered(self): - self.s1_cat_ordered.rank() + self.s_str_cat_ordered.rank() def time_rank_int(self): - self.s2.rank() + self.s_int.rank() def time_rank_int_cat(self): - self.s2_cat.rank() + self.s_int_cat.rank() def time_rank_int_cat_ordered(self): - self.s2_cat_ordered.rank() + self.s_int_cat_ordered.rank() + + +class Isin(object): + + params = ['object', 'int64'] + param_names = ['dtype'] + + def setup(self, dtype): + np.random.seed(1234) + n = 5 * 10**5 + sample_size = 100 + arr = [i for i in np.random.randint(0, n // 10, size=n)] + if dtype == 'object': + arr = ['s{:04d}'.format(i) for i in arr] + self.sample = np.random.choice(arr, sample_size) + self.series = pd.Series(arr).astype('category') + + def time_isin_categorical(self, dtype): + self.series.isin(self.sample) + + +class IsMonotonic(object): + + def setup(self): + N = 1000 + self.c = pd.CategoricalIndex(list('a' * N + 'b' * N + 'c' * N)) + self.s = pd.Series(self.c) + + def time_categorical_index_is_monotonic_increasing(self): + self.c.is_monotonic_increasing + + def time_categorical_index_is_monotonic_decreasing(self): + self.c.is_monotonic_decreasing + + def time_categorical_series_is_monotonic_increasing(self): + self.s.is_monotonic_increasing + + def time_categorical_series_is_monotonic_decreasing(self): + self.s.is_monotonic_decreasing + + +class Contains(object): + + def setup(self): + N = 10**5 + self.ci = tm.makeCategoricalIndex(N) + self.c = self.ci.values + self.key = self.ci.categories[0] + + def 
time_categorical_index_contains(self): + self.key in self.ci + + def time_categorical_contains(self): + self.key in self.c + + +class CategoricalSlicing(object): + + params = ['monotonic_incr', 'monotonic_decr', 'non_monotonic'] + param_names = ['index'] + + def setup(self, index): + N = 10**6 + categories = ['a', 'b', 'c'] + values = [0] * N + [1] * N + [2] * N + if index == 'monotonic_incr': + self.data = pd.Categorical.from_codes(values, + categories=categories) + elif index == 'monotonic_decr': + self.data = pd.Categorical.from_codes(list(reversed(values)), + categories=categories) + elif index == 'non_monotonic': + self.data = pd.Categorical.from_codes([0, 1, 2] * N, + categories=categories) + else: + raise ValueError('Invalid index param: {}'.format(index)) + + self.scalar = 10000 + self.list = list(range(10000)) + self.cat_scalar = 'b' + + def time_getitem_scalar(self, index): + self.data[self.scalar] + + def time_getitem_slice(self, index): + self.data[:self.scalar] + + def time_getitem_list_like(self, index): + self.data[[self.scalar]] + + def time_getitem_list(self, index): + self.data[self.list] + + def time_getitem_bool_array(self, index): + self.data[self.data == self.cat_scalar] + + +class Indexing(object): + + def setup(self): + N = 10**5 + self.index = pd.CategoricalIndex(range(N), range(N)) + self.series = pd.Series(range(N), index=self.index).sort_index() + self.category = self.index[500] + + def time_get_loc(self): + self.index.get_loc(self.category) + + def time_shape(self): + self.index.shape + + def time_shallow_copy(self): + self.index._shallow_copy() + + def time_align(self): + pd.DataFrame({'a': self.series, 'b': self.series[:500]}) + + def time_intersection(self): + self.index[:750].intersection(self.index[250:]) + + def time_unique(self): + self.index.unique() + + def time_reindex(self): + self.index.reindex(self.index[:500]) + + def time_reindex_missing(self): + self.index.reindex(['a', 'b', 'c', 'd']) + + def time_sort_values(self): + self.index.sort_values(ascending=False) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/ctors.py b/asv_bench/benchmarks/ctors.py index b5694a3a21502..5715c4fb2d0d4 100644 --- a/asv_bench/benchmarks/ctors.py +++ b/asv_bench/benchmarks/ctors.py @@ -1,30 +1,103 @@ -from .pandas_vb_common import * +import numpy as np +import pandas.util.testing as tm +from pandas import Series, Index, DatetimeIndex, Timestamp, MultiIndex -class Constructors(object): - goal_time = 0.2 +def no_change(arr): + return arr + + +def list_of_str(arr): + return list(arr.astype(str)) + + +def gen_of_str(arr): + return (x for x in arr.astype(str)) + + +def arr_dict(arr): + return dict(zip(range(len(arr)), arr)) + + +def list_of_tuples(arr): + return [(i, -i) for i in arr] + + +def gen_of_tuples(arr): + return ((i, -i) for i in arr) + + +def list_of_lists(arr): + return [[i, -i] for i in arr] + + +def list_of_tuples_with_none(arr): + return [(i, -i) for i in arr][:-1] + [None] - def setup(self): - self.arr = np.random.randn(100, 100) - self.arr_str = np.array(['foo', 'bar', 'baz'], dtype=object) - self.data = np.random.randn(100) - self.index = Index(np.arange(100)) +def list_of_lists_with_none(arr): + return [[i, -i] for i in arr][:-1] + [None] - self.s = Series(([Timestamp('20110101'), Timestamp('20120101'), - Timestamp('20130101')] * 1000)) - def time_frame_from_ndarray(self): - DataFrame(self.arr) +class SeriesConstructors(object): - def time_series_from_ndarray(self): - pd.Series(self.data, index=self.index) + 
param_names = ["data_fmt", "with_index", "dtype"] + params = [[no_change, + list, + list_of_str, + gen_of_str, + arr_dict, + list_of_tuples, + gen_of_tuples, + list_of_lists, + list_of_tuples_with_none, + list_of_lists_with_none], + [False, True], + ['float', 'int']] + + def setup(self, data_fmt, with_index, dtype): + N = 10**4 + if dtype == 'float': + arr = np.random.randn(N) + else: + arr = np.arange(N) + self.data = data_fmt(arr) + self.index = np.arange(N) if with_index else None + + def time_series_constructor(self, data_fmt, with_index, dtype): + Series(self.data, index=self.index) + + +class SeriesDtypesConstructors(object): + + def setup(self): + N = 10**4 + self.arr = np.random.randn(N) + self.arr_str = np.array(['foo', 'bar', 'baz'], dtype=object) + self.s = Series([Timestamp('20110101'), Timestamp('20120101'), + Timestamp('20130101')] * N * 10) def time_index_from_array_string(self): Index(self.arr_str) + def time_index_from_array_floats(self): + Index(self.arr) + def time_dtindex_from_series(self): DatetimeIndex(self.s) - def time_dtindex_from_series2(self): + def time_dtindex_from_index_with_series(self): Index(self.s) + + +class MultiIndexConstructor(object): + + def setup(self): + N = 10**4 + self.iterables = [tm.makeStringIndex(N), range(20)] + + def time_multiindex_from_iterables(self): + MultiIndex.from_product(self.iterables) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/dtypes.py b/asv_bench/benchmarks/dtypes.py new file mode 100644 index 0000000000000..e59154cd99965 --- /dev/null +++ b/asv_bench/benchmarks/dtypes.py @@ -0,0 +1,39 @@ +from pandas.api.types import pandas_dtype + +import numpy as np +from .pandas_vb_common import ( + numeric_dtypes, datetime_dtypes, string_dtypes, extension_dtypes) + + +_numpy_dtypes = [np.dtype(dtype) + for dtype in (numeric_dtypes + + datetime_dtypes + + string_dtypes)] +_dtypes = _numpy_dtypes + extension_dtypes + + +class Dtypes(object): + params = (_dtypes + + list(map(lambda dt: dt.name, _dtypes))) + param_names = ['dtype'] + + def time_pandas_dtype(self, dtype): + pandas_dtype(dtype) + + +class DtypesInvalid(object): + param_names = ['dtype'] + params = ['scalar-string', 'scalar-int', 'list-string', 'array-string'] + data_dict = {'scalar-string': 'foo', + 'scalar-int': 1, + 'list-string': ['foo'] * 1000, + 'array-string': np.array(['foo'] * 1000)} + + def time_pandas_dtype_invalid(self, dtype): + try: + pandas_dtype(self.data_dict[dtype]) + except TypeError: + pass + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/eval.py b/asv_bench/benchmarks/eval.py index a0819e33dc254..68df38cd50742 100644 --- a/asv_bench/benchmarks/eval.py +++ b/asv_bench/benchmarks/eval.py @@ -1,67 +1,64 @@ -from .pandas_vb_common import * +import numpy as np import pandas as pd -import pandas.computation.expressions as expr +try: + import pandas.core.computation.expressions as expr +except ImportError: + import pandas.computation.expressions as expr class Eval(object): - goal_time = 0.2 params = [['numexpr', 'python'], [1, 'all']] param_names = ['engine', 'threads'] def setup(self, engine, threads): - self.df = DataFrame(np.random.randn(20000, 100)) - self.df2 = DataFrame(np.random.randn(20000, 100)) - self.df3 = DataFrame(np.random.randn(20000, 100)) - self.df4 = DataFrame(np.random.randn(20000, 100)) + self.df = pd.DataFrame(np.random.randn(20000, 100)) + self.df2 = pd.DataFrame(np.random.randn(20000, 100)) + self.df3 = pd.DataFrame(np.random.randn(20000, 100)) + self.df4 = 
pd.DataFrame(np.random.randn(20000, 100)) if threads == 1: expr.set_numexpr_threads(1) def time_add(self, engine, threads): - df, df2, df3, df4 = self.df, self.df2, self.df3, self.df4 - pd.eval('df + df2 + df3 + df4', engine=engine) + pd.eval('self.df + self.df2 + self.df3 + self.df4', engine=engine) def time_and(self, engine, threads): - df, df2, df3, df4 = self.df, self.df2, self.df3, self.df4 - pd.eval('(df > 0) & (df2 > 0) & (df3 > 0) & (df4 > 0)', engine=engine) + pd.eval('(self.df > 0) & (self.df2 > 0) & ' + '(self.df3 > 0) & (self.df4 > 0)', engine=engine) def time_chained_cmp(self, engine, threads): - df, df2, df3, df4 = self.df, self.df2, self.df3, self.df4 - pd.eval('df < df2 < df3 < df4', engine=engine) + pd.eval('self.df < self.df2 < self.df3 < self.df4', engine=engine) def time_mult(self, engine, threads): - df, df2, df3, df4 = self.df, self.df2, self.df3, self.df4 - pd.eval('df * df2 * df3 * df4', engine=engine) + pd.eval('self.df * self.df2 * self.df3 * self.df4', engine=engine) def teardown(self, engine, threads): expr.set_numexpr_threads() class Query(object): - goal_time = 0.2 def setup(self): - self.N = 1000000 - self.halfway = ((self.N // 2) - 1) - self.index = date_range('20010101', periods=self.N, freq='T') - self.s = Series(self.index) - self.ts = self.s.iloc[self.halfway] - self.df = DataFrame({'a': np.random.randn(self.N), }, index=self.index) - self.df2 = DataFrame({'dates': self.s.values,}) - - self.df3 = DataFrame({'a': np.random.randn(self.N),}) - self.min_val = self.df3['a'].min() - self.max_val = self.df3['a'].max() + N = 10**6 + halfway = (N // 2) - 1 + index = pd.date_range('20010101', periods=N, freq='T') + s = pd.Series(index) + self.ts = s.iloc[halfway] + self.df = pd.DataFrame({'a': np.random.randn(N), 'dates': index}, + index=index) + data = np.random.randn(N) + self.min_val = data.min() + self.max_val = data.max() def time_query_datetime_index(self): - ts = self.ts - self.df.query('index < @ts') + self.df.query('index < @self.ts') - def time_query_datetime_series(self): - ts = self.ts - self.df2.query('dates < @ts') + def time_query_datetime_column(self): + self.df.query('dates < @self.ts') def time_query_with_boolean_selection(self): - min_val, max_val = self.min_val, self.max_val - self.df.query('(a >= @min_val) & (a <= @max_val)') + self.df.query('(a >= @self.min_val) & (a <= @self.max_val)') + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/frame_ctor.py b/asv_bench/benchmarks/frame_ctor.py index 05c1a27fdf8ca..dfb6ab5b189b2 100644 --- a/asv_bench/benchmarks/frame_ctor.py +++ b/asv_bench/benchmarks/frame_ctor.py @@ -1,138 +1,107 @@ -from .pandas_vb_common import * +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Series, MultiIndex, Timestamp, date_range try: - from pandas.tseries.offsets import * -except: - from pandas.core.datetools import * + from pandas.tseries.offsets import Nano, Hour +except ImportError: + # For compatibility with older versions + from pandas.core.datetools import * # noqa -#---------------------------------------------------------------------- -# Creation from nested dict - class FromDicts(object): - goal_time = 0.2 def setup(self): - (N, K) = (5000, 50) + N, K = 5000, 50 self.index = tm.makeStringIndex(N) self.columns = tm.makeStringIndex(K) - self.frame = DataFrame(np.random.randn(N, K), index=self.index, columns=self.columns) - try: - self.data = self.frame.to_dict() - except: - self.data = self.frame.toDict() - self.some_dict = 
self.data.values()[0] - self.dict_list = [dict(zip(self.columns, row)) for row in self.frame.values] - - self.data2 = dict( - ((i, dict(((j, float(j)) for j in range(100)))) for i in - xrange(2000))) - - def time_frame_ctor_list_of_dict(self): + frame = DataFrame(np.random.randn(N, K), index=self.index, + columns=self.columns) + self.data = frame.to_dict() + self.dict_list = frame.to_dict(orient='records') + self.data2 = {i: {j: float(j) for j in range(100)} + for i in range(2000)} + + def time_list_of_dict(self): DataFrame(self.dict_list) - def time_frame_ctor_nested_dict(self): + def time_nested_dict(self): DataFrame(self.data) - def time_series_ctor_from_dict(self): - Series(self.some_dict) + def time_nested_dict_index(self): + DataFrame(self.data, index=self.index) - def time_frame_ctor_nested_dict_int64(self): - # nested dict, integer indexes, regression described in #621 - DataFrame(self.data) + def time_nested_dict_columns(self): + DataFrame(self.data, columns=self.columns) + def time_nested_dict_index_columns(self): + DataFrame(self.data, index=self.index, columns=self.columns) -# from a mi-series + def time_nested_dict_int64(self): + # nested dict, integer indexes, regression described in #621 + DataFrame(self.data2) -class frame_from_series(object): - goal_time = 0.2 + +class FromSeries(object): def setup(self): - self.mi = MultiIndex.from_tuples([(x, y) for x in range(100) for y in range(100)]) - self.s = Series(randn(10000), index=self.mi) + mi = MultiIndex.from_product([range(100), range(100)]) + self.s = Series(np.random.randn(10000), index=mi) - def time_frame_from_mi_series(self): + def time_mi_series(self): DataFrame(self.s) -#---------------------------------------------------------------------- -# get_numeric_data - -class frame_get_numeric_data(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 25)) - self.df['foo'] = 'bar' - self.df['bar'] = 'baz' - self.df = self.df.consolidate() - - def time_frame_get_numeric_data(self): - self.df._get_numeric_data() +class FromDictwithTimestamp(object): + params = [Nano(1), Hour(1)] + param_names = ['offset'] -# ---------------------------------------------------------------------- -# From dict with DatetimeIndex with all offsets - -# dynamically generate benchmarks for every offset -# -# get_period_count & get_index_for_offset are there because blindly taking each -# offset times 1000 can easily go out of Timestamp bounds and raise errors. 
+ def setup(self, offset): + N = 10**3 + np.random.seed(1234) + idx = date_range(Timestamp('1/1/1900'), freq=offset, periods=N) + df = DataFrame(np.random.randn(N, 10), index=idx) + self.d = df.to_dict() + def time_dict_with_timestamp_offsets(self, offset): + DataFrame(self.d) -def get_period_count(start_date, off): - ten_offsets_in_days = ((start_date + (off * 10)) - start_date).days - if (ten_offsets_in_days == 0): - return 1000 - else: - return min((9 * ((Timestamp.max - start_date).days // ten_offsets_in_days)), 1000) +class FromRecords(object): -def get_index_for_offset(off): - start_date = Timestamp('1/1/1900') - return date_range(start_date, periods=min(1000, get_period_count( - start_date, off)), freq=off) + params = [None, 1000] + param_names = ['nrows'] + def setup(self, nrows): + N = 100000 + self.gen = ((x, (x * 20), (x * 100)) for x in range(N)) -all_offsets = offsets.__all__ -# extra cases -for off in ['FY5253', 'FY5253Quarter']: - all_offsets.pop(all_offsets.index(off)) - all_offsets.extend([off + '_1', off + '_2']) + def time_frame_from_records_generator(self, nrows): + # issue-6700 + self.df = DataFrame.from_records(self.gen, nrows=nrows) -class FrameConstructorDTIndexFromOffsets(object): +class FromNDArray(object): - params = [all_offsets, [1, 2]] - param_names = ['offset', 'n_steps'] + def setup(self): + N = 100000 + self.data = np.random.randn(N) - offset_kwargs = {'WeekOfMonth': {'weekday': 1, 'week': 1}, - 'LastWeekOfMonth': {'weekday': 1, 'week': 1}, - 'FY5253': {'startingMonth': 1, 'weekday': 1}, - 'FY5253Quarter': {'qtr_with_extra_week': 1, 'startingMonth': 1, 'weekday': 1}} + def time_frame_from_ndarray(self): + self.df = DataFrame(self.data) - offset_extra_cases = {'FY5253': {'variation': ['nearest', 'last']}, - 'FY5253Quarter': {'variation': ['nearest', 'last']}} - def setup(self, offset, n_steps): +class FromLists(object): - extra = False - if offset.endswith("_", None, -1): - extra = int(offset[-1]) - offset = offset[:-2] + goal_time = 0.2 - kwargs = {} - if offset in self.offset_kwargs: - kwargs = self.offset_kwargs[offset] + def setup(self): + N = 1000 + M = 100 + self.data = [[j for j in range(M)] for i in range(N)] - if extra: - extras = self.offset_extra_cases[offset] - for extra_arg in extras: - kwargs[extra_arg] = extras[extra_arg][extra -1] + def time_frame_from_lists(self): + self.df = DataFrame(self.data) - offset = getattr(offsets, offset) - self.idx = get_index_for_offset(offset(n_steps, **kwargs)) - self.df = DataFrame(np.random.randn(len(self.idx), 10), index=self.idx) - self.d = dict([(col, self.df[col]) for col in self.df.columns]) - def time_frame_ctor(self, offset, n_steps): - DataFrame(self.d) +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/frame_methods.py b/asv_bench/benchmarks/frame_methods.py index 9f491302a4d6f..ba2e63c20d3f8 100644 --- a/asv_bench/benchmarks/frame_methods.py +++ b/asv_bench/benchmarks/frame_methods.py @@ -1,20 +1,36 @@ -from .pandas_vb_common import * import string +import numpy as np -#---------------------------------------------------------------------- -# lookup +from pandas import ( + DataFrame, MultiIndex, NaT, Series, date_range, isnull, period_range) +import pandas.util.testing as tm -class frame_fancy_lookup(object): - goal_time = 0.2 + +class GetNumericData(object): + + def setup(self): + self.df = DataFrame(np.random.randn(10000, 25)) + self.df['foo'] = 'bar' + self.df['bar'] = 'baz' + self.df = self.df._consolidate() + + def time_frame_get_numeric_data(self): + 
self.df._get_numeric_data() + + +class Lookup(object): def setup(self): - self.df = DataFrame(np.random.randn(10000, 8), columns=list('abcdefgh')) + self.df = DataFrame(np.random.randn(10000, 8), + columns=list('abcdefgh')) self.df['foo'] = 'bar' self.row_labels = list(self.df.index[::10])[:900] - self.col_labels = (list(self.df.columns) * 100) - self.row_labels_all = np.array((list(self.df.index) * len(self.df.columns)), dtype='object') - self.col_labels_all = np.array((list(self.df.columns) * len(self.df.index)), dtype='object') + self.col_labels = list(self.df.columns) * 100 + self.row_labels_all = np.array( + list(self.df.index) * len(self.df.columns), dtype='object') + self.col_labels_all = np.array( + list(self.df.columns) * len(self.df.index), dtype='object') def time_frame_fancy_lookup(self): self.df.lookup(self.row_labels, self.col_labels) @@ -23,25 +39,18 @@ def time_frame_fancy_lookup_all(self): self.df.lookup(self.row_labels_all, self.col_labels_all) -#---------------------------------------------------------------------- -# reindex - class Reindex(object): - goal_time = 0.2 def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.idx = np.arange(4000, 7000) - + N = 10**3 + self.df = DataFrame(np.random.randn(N * 10, N)) + self.idx = np.arange(4 * N, 7 * N) self.df2 = DataFrame( - dict([(c, {0: randint(0, 2, 1000).astype(np.bool_), - 1: randint(0, 1000, 1000).astype( - np.int16), - 2: randint(0, 1000, 1000).astype( - np.int32), - 3: randint(0, 1000, 1000).astype( - np.int64),}[randint(0, 4)]) for c in - range(1000)])) + {c: {0: np.random.randint(0, 2, N).astype(np.bool_), + 1: np.random.randint(0, N, N).astype(np.int16), + 2: np.random.randint(0, N, N).astype(np.int32), + 3: np.random.randint(0, N, N).astype(np.int64)} + [np.random.randint(0, 4)] for c in range(N)}) def time_reindex_axis0(self): self.df.reindex(self.idx) @@ -52,82 +61,167 @@ def time_reindex_axis1(self): def time_reindex_both_axes(self): self.df.reindex(index=self.idx, columns=self.idx) - def time_reindex_both_axes_ix(self): - self.df.ix[(self.idx, self.idx)] - def time_reindex_upcast(self): - self.df2.reindex(permutation(range(1200))) + self.df2.reindex(np.random.permutation(range(1200))) -#---------------------------------------------------------------------- -# iteritems (monitor no-copying behaviour) +class Rename(object): + + def setup(self): + N = 10**3 + self.df = DataFrame(np.random.randn(N * 10, N)) + self.idx = np.arange(4 * N, 7 * N) + self.dict_idx = {k: k for k in self.idx} + self.df2 = DataFrame( + {c: {0: np.random.randint(0, 2, N).astype(np.bool_), + 1: np.random.randint(0, N, N).astype(np.int16), + 2: np.random.randint(0, N, N).astype(np.int32), + 3: np.random.randint(0, N, N).astype(np.int64)} + [np.random.randint(0, 4)] for c in range(N)}) + + def time_rename_single(self): + self.df.rename({0: 0}) + + def time_rename_axis0(self): + self.df.rename(self.dict_idx) + + def time_rename_axis1(self): + self.df.rename(columns=self.dict_idx) + + def time_rename_both_axes(self): + self.df.rename(index=self.dict_idx, columns=self.dict_idx) + + def time_dict_rename_both_axes(self): + self.df.rename(index=self.dict_idx, columns=self.dict_idx) + class Iteration(object): - goal_time = 0.2 def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.df2 = DataFrame(np.random.randn(50000, 10)) - self.df3 = pd.DataFrame(np.random.randn(1000,5000), - columns=['C'+str(c) for c in range(5000)]) + N = 1000 + self.df = DataFrame(np.random.randn(N * 10, N)) + self.df2 = DataFrame(np.random.randn(N * 
50, 10)) + self.df3 = DataFrame(np.random.randn(N, 5 * N), + columns=['C' + str(c) for c in range(N * 5)]) + self.df4 = DataFrame(np.random.randn(N * 1000, 10)) - def f(self): + def time_iteritems(self): + # (monitor no-copying behaviour) if hasattr(self.df, '_item_cache'): self.df._item_cache.clear() - for (name, col) in self.df.iteritems(): + for name, col in self.df.iteritems(): pass - def g(self): - for (name, col) in self.df.iteritems(): + def time_iteritems_cached(self): + for name, col in self.df.iteritems(): pass - def time_iteritems(self): - self.f() + def time_iteritems_indexing(self): + for col in self.df3: + self.df3[col] - def time_iteritems_cached(self): - self.g() + def time_itertuples_start(self): + self.df4.itertuples() - def time_iteritems_indexing(self): - df = self.df3 - for col in df: - df[col] + def time_itertuples_read_first(self): + next(self.df4.itertuples()) def time_itertuples(self): - for row in self.df2.itertuples(): + for row in self.df4.itertuples(): pass + def time_itertuples_to_list(self): + list(self.df4.itertuples()) -#---------------------------------------------------------------------- -# to_string, to_html, repr + def mem_itertuples_start(self): + return self.df4.itertuples() -class Formatting(object): - goal_time = 0.2 + def peakmem_itertuples_start(self): + self.df4.itertuples() - def setup(self): - self.df = DataFrame(randn(100, 10)) + def mem_itertuples_read_first(self): + return next(self.df4.itertuples()) + + def peakmem_itertuples(self): + for row in self.df4.itertuples(): + pass + + def mem_itertuples_to_list(self): + return list(self.df4.itertuples()) + + def peakmem_itertuples_to_list(self): + list(self.df4.itertuples()) + + def time_itertuples_raw_start(self): + self.df4.itertuples(index=False, name=None) + + def time_itertuples_raw_read_first(self): + next(self.df4.itertuples(index=False, name=None)) + + def time_itertuples_raw_tuples(self): + for row in self.df4.itertuples(index=False, name=None): + pass + + def time_itertuples_raw_tuples_to_list(self): + list(self.df4.itertuples(index=False, name=None)) + + def mem_itertuples_raw_start(self): + return self.df4.itertuples(index=False, name=None) + + def peakmem_itertuples_raw_start(self): + self.df4.itertuples(index=False, name=None) + + def peakmem_itertuples_raw_read_first(self): + next(self.df4.itertuples(index=False, name=None)) + + def peakmem_itertuples_raw(self): + for row in self.df4.itertuples(index=False, name=None): + pass + + def mem_itertuples_raw_to_list(self): + return list(self.df4.itertuples(index=False, name=None)) - self.nrows = 500 - self.df2 = DataFrame(randn(self.nrows, 10)) - self.df2[0] = period_range('2000', '2010', self.nrows) - self.df2[1] = range(self.nrows) + def peakmem_itertuples_raw_to_list(self): + list(self.df4.itertuples(index=False, name=None)) - self.nrows = 10000 - self.data = randn(self.nrows, 10) - self.idx = MultiIndex.from_arrays(np.tile(randn(3, int(self.nrows / 100)), 100)) - self.df3 = DataFrame(self.data, index=self.idx) - self.idx = randn(self.nrows) - self.df4 = DataFrame(self.data, index=self.idx) + def time_iterrows(self): + for row in self.df.iterrows(): + pass - self.df_tall = pandas.DataFrame(np.random.randn(10000, 10)) - self.df_wide = pandas.DataFrame(np.random.randn(10, 10000)) +class ToString(object): + + def setup(self): + self.df = DataFrame(np.random.randn(100, 10)) def time_to_string_floats(self): self.df.to_string() + +class ToHTML(object): + + def setup(self): + nrows = 500 + self.df2 = DataFrame(np.random.randn(nrows, 10)) + 
self.df2[0] = period_range('2000', periods=nrows) + self.df2[1] = range(nrows) + def time_to_html_mixed(self): self.df2.to_html() + +class Repr(object): + + def setup(self): + nrows = 10000 + data = np.random.randn(nrows, 10) + arrays = np.tile(np.random.randn(3, int(nrows / 100)), 100) + idx = MultiIndex.from_arrays(arrays) + self.df3 = DataFrame(data, index=idx) + self.df4 = DataFrame(data, index=np.random.randn(nrows)) + self.df_tall = DataFrame(np.random.randn(nrows, 10)) + self.df_wide = DataFrame(np.random.randn(10, nrows)) + def time_html_repr_trunc_mi(self): self.df3._repr_html_() @@ -141,21 +235,14 @@ def time_frame_repr_wide(self): repr(self.df_wide) -#---------------------------------------------------------------------- -# nulls/masking - - -## masking - -class frame_mask_bools(object): - goal_time = 0.2 +class MaskBool(object): def setup(self): - self.data = np.random.randn(1000, 500) - self.df = DataFrame(self.data) - self.df = self.df.where((self.df > 0)) - self.bools = (self.df > 0) - self.mask = isnull(self.df) + data = np.random.randn(1000, 500) + df = DataFrame(data) + df = df.where(df > 0) + self.bools = df > 0 + self.mask = isnull(df) def time_frame_mask_bools(self): self.bools.mask(self.mask) @@ -164,31 +251,24 @@ def time_frame_mask_floats(self): self.bools.astype(float).mask(self.mask) -## isnull - -class FrameIsnull(object): - goal_time = 0.2 +class Isnull(object): def setup(self): - self.df_no_null = DataFrame(np.random.randn(1000, 1000)) - - np.random.seed(1234) - self.sample = np.array([np.nan, 1.0]) - self.data = np.random.choice(self.sample, (1000, 1000)) - self.df = DataFrame(self.data) - - np.random.seed(1234) - self.sample = np.array(list(string.ascii_lowercase) + - list(string.ascii_uppercase) + - list(string.whitespace)) - self.data = np.random.choice(self.sample, (1000, 1000)) - self.df_strings= DataFrame(self.data) - - np.random.seed(1234) - self.sample = np.array([NaT, np.nan, None, np.datetime64('NaT'), - np.timedelta64('NaT'), 0, 1, 2.0, '', 'abcd']) - self.data = np.random.choice(self.sample, (1000, 1000)) - self.df_obj = DataFrame(self.data) + N = 10**3 + self.df_no_null = DataFrame(np.random.randn(N, N)) + + sample = np.array([np.nan, 1.0]) + data = np.random.choice(sample, (N, N)) + self.df = DataFrame(data) + + sample = np.array(list(string.ascii_letters + string.whitespace)) + data = np.random.choice(sample, (N, N)) + self.df_strings = DataFrame(data) + + sample = np.array([NaT, np.nan, None, np.datetime64('NaT'), + np.timedelta64('NaT'), 0, 1, 2.0, '', 'abcd']) + data = np.random.choice(sample, (N, N)) + self.df_obj = DataFrame(data) def time_isnull_floats_no_null(self): isnull(self.df_no_null) @@ -203,126 +283,97 @@ def time_isnull_obj(self): isnull(self.df_obj) -# ---------------------------------------------------------------------- -# fillna in place - -class frame_fillna_inplace(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 100)) - self.df.values[::2] = np.nan - - def time_frame_fillna_inplace(self): - self.df.fillna(0, inplace=True) +class Fillna(object): + params = ([True, False], ['pad', 'bfill']) + param_names = ['inplace', 'method'] + def setup(self, inplace, method): + values = np.random.randn(10000, 100) + values[::2] = np.nan + self.df = DataFrame(values) -class frame_fillna_many_columns_pad(object): - goal_time = 0.2 - - def setup(self): - self.values = np.random.randn(1000, 1000) - self.values[::2] = np.nan - self.df = DataFrame(self.values) - - def time_frame_fillna_many_columns_pad(self): - 
self.df.fillna(method='pad') - + def time_frame_fillna(self, inplace, method): + self.df.fillna(inplace=inplace, method=method) class Dropna(object): - goal_time = 0.2 - def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) + params = (['all', 'any'], [0, 1]) + param_names = ['how', 'axis'] + + def setup(self, how, axis): + self.df = DataFrame(np.random.randn(10000, 1000)) self.df.ix[50:1000, 20:50] = np.nan self.df.ix[2000:3000] = np.nan self.df.ix[:, 60:70] = np.nan self.df_mixed = self.df.copy() self.df_mixed['foo'] = 'bar' - self.df_mi = self.df.copy() - self.df_mi.index = MultiIndex.from_tuples(self.df_mi.index.map((lambda x: (x, x)))) - self.df_mi.columns = MultiIndex.from_tuples(self.df_mi.columns.map((lambda x: (x, x)))) - - self.df_mixed_mi = self.df_mixed.copy() - self.df_mixed_mi.index = MultiIndex.from_tuples(self.df_mixed_mi.index.map((lambda x: (x, x)))) - self.df_mixed_mi.columns = MultiIndex.from_tuples(self.df_mixed_mi.columns.map((lambda x: (x, x)))) - - def time_dropna_axis0_all(self): - self.df.dropna(how='all', axis=0) - - def time_dropna_axis0_any(self): - self.df.dropna(how='any', axis=0) - - def time_dropna_axis1_all(self): - self.df.dropna(how='all', axis=1) + def time_dropna(self, how, axis): + self.df.dropna(how=how, axis=axis) - def time_dropna_axis1_any(self): - self.df.dropna(how='any', axis=1) + def time_dropna_axis_mixed_dtypes(self, how, axis): + self.df_mixed.dropna(how=how, axis=axis) - def time_dropna_axis0_all_mixed_dtypes(self): - self.df_mixed.dropna(how='all', axis=0) - def time_dropna_axis0_any_mixed_dtypes(self): - self.df_mixed.dropna(how='any', axis=0) +class Count(object): - def time_dropna_axis1_all_mixed_dtypes(self): - self.df_mixed.dropna(how='all', axis=1) + params = [0, 1] + param_names = ['axis'] - def time_dropna_axis1_any_mixed_dtypes(self): - self.df_mixed.dropna(how='any', axis=1) - - def time_count_level_axis0_multi(self): - self.df_mi.count(axis=0, level=1) + def setup(self, axis): + self.df = DataFrame(np.random.randn(10000, 1000)) + self.df.ix[50:1000, 20:50] = np.nan + self.df.ix[2000:3000] = np.nan + self.df.ix[:, 60:70] = np.nan + self.df_mixed = self.df.copy() + self.df_mixed['foo'] = 'bar' - def time_count_level_axis1_multi(self): - self.df_mi.count(axis=1, level=1) + self.df.index = MultiIndex.from_arrays([self.df.index, self.df.index]) + self.df.columns = MultiIndex.from_arrays([self.df.columns, + self.df.columns]) + self.df_mixed.index = MultiIndex.from_arrays([self.df_mixed.index, + self.df_mixed.index]) + self.df_mixed.columns = MultiIndex.from_arrays([self.df_mixed.columns, + self.df_mixed.columns]) - def time_count_level_axis0_mixed_dtypes_multi(self): - self.df_mixed_mi.count(axis=0, level=1) + def time_count_level_multi(self, axis): + self.df.count(axis=axis, level=1) - def time_count_level_axis1_mixed_dtypes_multi(self): - self.df_mixed_mi.count(axis=1, level=1) + def time_count_level_mixed_dtypes_multi(self, axis): + self.df_mixed.count(axis=axis, level=1) class Apply(object): - goal_time = 0.2 def setup(self): self.df = DataFrame(np.random.randn(1000, 100)) self.s = Series(np.arange(1028.0)) self.df2 = DataFrame({i: self.s for i in range(1028)}) - self.df3 = DataFrame(np.random.randn(1000, 3), columns=list('ABC')) def time_apply_user_func(self): - self.df2.apply((lambda x: np.corrcoef(x, self.s)[(0, 1)])) + self.df2.apply(lambda x: np.corrcoef(x, self.s)[(0, 1)]) def time_apply_axis_1(self): - self.df.apply((lambda x: (x + 1)), axis=1) + self.df.apply(lambda x: x + 1, axis=1) 
def time_apply_lambda_mean(self): - self.df.apply((lambda x: x.mean())) + self.df.apply(lambda x: x.mean()) def time_apply_np_mean(self): self.df.apply(np.mean) def time_apply_pass_thru(self): - self.df.apply((lambda x: x)) + self.df.apply(lambda x: x) def time_apply_ref_by_name(self): - self.df3.apply((lambda x: (x['A'] + x['B'])), axis=1) + self.df3.apply(lambda x: x['A'] + x['B'], axis=1) -#---------------------------------------------------------------------- -# dtypes - -class frame_dtypes(object): - goal_time = 0.2 +class Dtypes(object): def setup(self): self.df = DataFrame(np.random.randn(1000, 1000)) @@ -330,331 +381,205 @@ def setup(self): def time_frame_dtypes(self): self.df.dtypes -#---------------------------------------------------------------------- -# equals class Equals(object): - goal_time = 0.2 def setup(self): - self.float_df = DataFrame(np.random.randn(1000, 1000)) - self.object_df = DataFrame(([(['foo'] * 1000)] * 1000)) - self.nonunique_cols = self.object_df.copy() - self.nonunique_cols.columns = (['A'] * len(self.nonunique_cols.columns)) - self.pairs = dict([(name, self.make_pair(frame)) for (name, frame) in ( - ('float_df', self.float_df), ('object_df', self.object_df), - ('nonunique_cols', self.nonunique_cols))]) + N = 10**3 + self.float_df = DataFrame(np.random.randn(N, N)) + self.float_df_nan = self.float_df.copy() + self.float_df_nan.iloc[-1, -1] = np.nan - def make_pair(self, frame): - self.df = frame - self.df2 = self.df.copy() - self.df2.ix[((-1), (-1))] = np.nan - return (self.df, self.df2) + self.object_df = DataFrame('foo', index=range(N), columns=range(N)) + self.object_df_nan = self.object_df.copy() + self.object_df_nan.iloc[-1, -1] = np.nan - def test_equal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df) - - def test_unequal(self, name): - (self.df, self.df2) = self.pairs[name] - return self.df.equals(self.df2) + self.nonunique_cols = self.object_df.copy() + self.nonunique_cols.columns = ['A'] * len(self.nonunique_cols.columns) + self.nonunique_cols_nan = self.nonunique_cols.copy() + self.nonunique_cols_nan.iloc[-1, -1] = np.nan def time_frame_float_equal(self): - self.test_equal('float_df') + self.float_df.equals(self.float_df) def time_frame_float_unequal(self): - self.test_unequal('float_df') + self.float_df.equals(self.float_df_nan) def time_frame_nonunique_equal(self): - self.test_equal('nonunique_cols') + self.nonunique_cols.equals(self.nonunique_cols) def time_frame_nonunique_unequal(self): - self.test_unequal('nonunique_cols') + self.nonunique_cols.equals(self.nonunique_cols_nan) def time_frame_object_equal(self): - self.test_equal('object_df') + self.object_df.equals(self.object_df) def time_frame_object_unequal(self): - self.test_unequal('object_df') + self.object_df.equals(self.object_df_nan) class Interpolate(object): - goal_time = 0.2 - def setup(self): + params = [None, 'infer'] + param_names = ['downcast'] + + def setup(self, downcast): + N = 10000 # this is the worst case, where every column has NaNs. 
- self.df = DataFrame(randn(10000, 100)) + self.df = DataFrame(np.random.randn(N, 100)) self.df.values[::2] = np.nan - self.df2 = DataFrame( - {'A': np.arange(0, 10000), 'B': np.random.randint(0, 100, 10000), - 'C': randn(10000), 'D': randn(10000),}) + self.df2 = DataFrame({'A': np.arange(0, N), + 'B': np.random.randint(0, 100, N), + 'C': np.random.randn(N), + 'D': np.random.randn(N)}) self.df2.loc[1::5, 'A'] = np.nan self.df2.loc[1::5, 'C'] = np.nan - def time_interpolate(self): - self.df.interpolate() + def time_interpolate(self, downcast): + self.df.interpolate(downcast=downcast) - def time_interpolate_some_good(self): - self.df2.interpolate() - - def time_interpolate_some_good_infer(self): - self.df2.interpolate(downcast='infer') + def time_interpolate_some_good(self, downcast): + self.df2.interpolate(downcast=downcast) class Shift(object): # frame shift speedup issue-5609 - goal_time = 0.2 + params = [0, 1] + param_names = ['axis'] - def setup(self): + def setup(self, axis): self.df = DataFrame(np.random.rand(10000, 500)) - def time_shift_axis0(self): - self.df.shift(1, axis=0) - - def time_shift_axis_1(self): - self.df.shift(1, axis=1) - - -#----------------------------------------------------------------------------- -# from_records issue-6700 - -class frame_from_records_generator(object): - goal_time = 0.2 - - def get_data(self, n=100000): - return ((x, (x * 20), (x * 100)) for x in range(n)) - - def time_frame_from_records_generator(self): - self.df = DataFrame.from_records(self.get_data()) - - def time_frame_from_records_generator_nrows(self): - self.df = DataFrame.from_records(self.get_data(), nrows=1000) - + def time_shift(self, axis): + self.df.shift(1, axis=axis) -#----------------------------------------------------------------------------- -# nunique - -class frame_nunique(object): +class Nunique(object): def setup(self): - self.data = np.random.randn(10000, 1000) - self.df = DataFrame(self.data) + self.df = DataFrame(np.random.randn(10000, 1000)) def time_frame_nunique(self): self.df.nunique() - -#----------------------------------------------------------------------------- -# duplicated - -class frame_duplicated(object): - goal_time = 0.2 +class Duplicated(object): def setup(self): - self.n = (1 << 20) - self.t = date_range('2015-01-01', freq='S', periods=(self.n // 64)) - self.xs = np.random.randn((self.n // 64)).round(2) - self.df = DataFrame({'a': np.random.randint(((-1) << 8), (1 << 8), self.n), 'b': np.random.choice(self.t, self.n), 'c': np.random.choice(self.xs, self.n), }) - - self.df2 = DataFrame(np.random.randn(1000, 100).astype(str)) + n = (1 << 20) + t = date_range('2015-01-01', freq='S', periods=(n // 64)) + xs = np.random.randn(n // 64).round(2) + self.df = DataFrame({'a': np.random.randint(-1 << 8, 1 << 8, n), + 'b': np.random.choice(t, n), + 'c': np.random.choice(xs, n)}) + self.df2 = DataFrame(np.random.randn(1000, 100).astype(str)).T def time_frame_duplicated(self): self.df.duplicated() def time_frame_duplicated_wide(self): - self.df2.T.duplicated() - + self.df2.duplicated() +class XS(object): + params = [0, 1] + param_names = ['axis'] + def setup(self, axis): + self.N = 10**4 + self.df = DataFrame(np.random.randn(self.N, self.N)) + def time_frame_xs(self, axis): + self.df.xs(self.N / 2, axis=axis) +class SortValues(object): + params = [True, False] + param_names = ['ascending'] + def setup(self, ascending): + self.df = DataFrame(np.random.randn(1000000, 2), columns=list('AB')) + def time_frame_sort_values(self, ascending): + self.df.sort_values(by='A', 
ascending=ascending) - - - - -class frame_xs_col(object): - goal_time = 0.2 +class SortIndexByColumns(object): def setup(self): - self.df = DataFrame(randn(1, 100000)) + N = 10000 + K = 10 + self.df = DataFrame({'key1': tm.makeStringIndex(N).values.repeat(K), + 'key2': tm.makeStringIndex(N).values.repeat(K), + 'value': np.random.randn(N * K)}) - def time_frame_xs_col(self): - self.df.xs(50000, axis=1) + def time_frame_sort_values_by_columns(self): + self.df.sort_values(by=['key1', 'key2']) -class frame_xs_row(object): - goal_time = 0.2 +class Quantile(object): - def setup(self): - self.df = DataFrame(randn(100000, 1)) + params = [0, 1] + param_names = ['axis'] - def time_frame_xs_row(self): - self.df.xs(50000) + def setup(self, axis): + self.df = DataFrame(np.random.randn(1000, 3), columns=list('ABC')) + def time_frame_quantile(self, axis): + self.df.quantile([0.1, 0.5], axis=axis) -class frame_sort_index(object): - goal_time = 0.2 +class GetDtypeCounts(object): + # 2807 def setup(self): - self.df = DataFrame(randn(1000000, 2), columns=list('AB')) - - def time_frame_sort_index(self): - self.df.sort_index() + self.df = DataFrame(np.random.randn(10, 10000)) + def time_frame_get_dtype_counts(self): + self.df.get_dtype_counts() -class frame_sort_index_by_columns(object): - goal_time = 0.2 + def time_info(self): + self.df.info() - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - def time_frame_sort_index_by_columns(self): - self.df.sort_index(by=['key1', 'key2']) +class NSort(object): + params = ['first', 'last', 'all'] + param_names = ['keep'] -class frame_quantile_axis1(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 3), + def setup(self, keep): + self.df = DataFrame(np.random.randn(100000, 3), columns=list('ABC')) - def time_frame_quantile_axis1(self): - self.df.quantile([0.1, 0.5], axis=1) - - -#---------------------------------------------------------------------- -# boolean indexing + def time_nlargest_one_column(self, keep): + self.df.nlargest(100, 'A', keep=keep) -class frame_boolean_row_select(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 100)) - self.bool_arr = np.zeros(10000, dtype=bool) - self.bool_arr[:1000] = True - - def time_frame_boolean_row_select(self): - self.df[self.bool_arr] - -class frame_getitem_single_column(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(randn(10000, 1000)) - self.df2 = DataFrame(randn(3000, 1), columns=['A']) - self.df3 = DataFrame(randn(3000, 1)) - - def h(self): - for i in range(10000): - self.df2['A'] - - def j(self): - for i in range(10000): - self.df3[0] - - def time_frame_getitem_single_column(self): - self.h() - - def time_frame_getitem_single_column2(self): - self.j() + def time_nlargest_two_columns(self, keep): + self.df.nlargest(100, ['A', 'B'], keep=keep) + def time_nsmallest_one_column(self, keep): + self.df.nsmallest(100, 'A', keep=keep) -#---------------------------------------------------------------------- -# assignment - -class frame_assign_timeseries_index(object): - goal_time = 0.2 - - def setup(self): - self.idx = date_range('1/1/2000', periods=100000, freq='D') - self.df = DataFrame(randn(100000, 1), columns=['A'], index=self.idx) - - def 
time_frame_assign_timeseries_index(self): - self.f(self.df) - - def f(self, df): - self.x = self.df.copy() - self.x['date'] = self.x.index + def time_nsmallest_two_columns(self, keep): + self.df.nsmallest(100, ['A', 'B'], keep=keep) - -# insert many columns - -class frame_insert_100_columns_begin(object): - goal_time = 0.2 +class Describe(object): def setup(self): - self.N = 1000 - - def f(self, K=100): - self.df = DataFrame(index=range(self.N)) - self.new_col = np.random.randn(self.N) - for i in range(K): - self.df.insert(0, i, self.new_col) - - def g(self, K=500): - self.df = DataFrame(index=range(self.N)) - self.new_col = np.random.randn(self.N) - for i in range(K): - self.df[i] = self.new_col - - def time_frame_insert_100_columns_begin(self): - self.f() + self.df = DataFrame({ + 'a': np.random.randint(0, 100, int(1e6)), + 'b': np.random.randint(0, 100, int(1e6)), + 'c': np.random.randint(0, 100, int(1e6)) + }) - def time_frame_insert_500_columns_end(self): - self.g() + def time_series_describe(self): + self.df['a'].describe() + def time_dataframe_describe(self): + self.df.describe() -#---------------------------------------------------------------------- -# strings methods, #2602 - -class series_string_vector_slice(object): - goal_time = 0.2 - - def setup(self): - self.s = Series((['abcdefg', np.nan] * 500000)) - - def time_series_string_vector_slice(self): - self.s.str[:5] - - -#---------------------------------------------------------------------- -# df.info() and get_dtype_counts() # 2807 - -class frame_get_dtype_counts(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(10, 10000)) - - def time_frame_get_dtype_counts(self): - self.df.get_dtype_counts() - - -class frame_nlargest(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 3), - columns=list('ABC')) - - def time_frame_nlargest(self): - self.df.nlargest(100, 'A') +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/gil.py b/asv_bench/benchmarks/gil.py index 1c5e59672cb57..6819a296c81df 100644 --- a/asv_bench/benchmarks/gil.py +++ b/asv_bench/benchmarks/gil.py @@ -1,235 +1,134 @@ -from .pandas_vb_common import * -from pandas.core import common as com - +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Series, read_csv, factorize, date_range +from pandas.core.algorithms import take_1d try: - from cStringIO import StringIO + from pandas import (rolling_median, rolling_mean, rolling_min, rolling_max, + rolling_var, rolling_skew, rolling_kurt, rolling_std) + have_rolling_methods = True except ImportError: - from io import StringIO - + have_rolling_methods = False +try: + from pandas._libs import algos +except ImportError: + from pandas import algos try: from pandas.util.testing import test_parallel - have_real_test_parallel = True except ImportError: have_real_test_parallel = False - def test_parallel(num_threads=1): - def wrapper(fname): return fname - return wrapper +from .pandas_vb_common import BaseIO -class NoGilGroupby(object): - goal_time = 0.2 - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) +class ParallelGroupbyMethods(object): - np.random.seed(1234) - self.size = 2 ** 22 - self.ngroups = 100 - self.data = Series(np.random.randint(0, self.ngroups, size=self.size)) + params = ([2, 4, 8], ['count', 'last', 'max', 'mean', 'min', 'prod', + 
'sum', 'var']) + param_names = ['threads', 'method'] - if (not have_real_test_parallel): + def setup(self, threads, method): + if not have_real_test_parallel: raise NotImplementedError + N = 10**6 + ngroups = 10**3 + df = DataFrame({'key': np.random.randint(0, ngroups, size=N), + 'data': np.random.randn(N)}) - @test_parallel(num_threads=2) - def _pg2_count(self): - self.df.groupby('key')['data'].count() - - def time_count_2(self): - self._pg2_count() - - @test_parallel(num_threads=2) - def _pg2_last(self): - self.df.groupby('key')['data'].last() - - def time_last_2(self): - self._pg2_last() - - @test_parallel(num_threads=2) - def _pg2_max(self): - self.df.groupby('key')['data'].max() - - def time_max_2(self): - self._pg2_max() - - @test_parallel(num_threads=2) - def _pg2_mean(self): - self.df.groupby('key')['data'].mean() - - def time_mean_2(self): - self._pg2_mean() - - @test_parallel(num_threads=2) - def _pg2_min(self): - self.df.groupby('key')['data'].min() - - def time_min_2(self): - self._pg2_min() - - @test_parallel(num_threads=2) - def _pg2_prod(self): - self.df.groupby('key')['data'].prod() - - def time_prod_2(self): - self._pg2_prod() - - @test_parallel(num_threads=2) - def _pg2_sum(self): - self.df.groupby('key')['data'].sum() - - def time_sum_2(self): - self._pg2_sum() - - @test_parallel(num_threads=4) - def _pg4_sum(self): - self.df.groupby('key')['data'].sum() - - def time_sum_4(self): - self._pg4_sum() - - def time_sum_4_notp(self): - for i in range(4): - self.df.groupby('key')['data'].sum() - - def _f_sum(self): - self.df.groupby('key')['data'].sum() - - @test_parallel(num_threads=8) - def _pg8_sum(self): - self._f_sum() - - def time_sum_8(self): - self._pg8_sum() - - def time_sum_8_notp(self): - for i in range(8): - self._f_sum() - - @test_parallel(num_threads=2) - def _pg2_var(self): - self.df.groupby('key')['data'].var() - - def time_var_2(self): - self._pg2_var() - - # get groups - - def _groups(self): - self.data.groupby(self.data).groups - - @test_parallel(num_threads=2) - def _pg2_groups(self): - self._groups() - - def time_groups_2(self): - self._pg2_groups() - - @test_parallel(num_threads=4) - def _pg4_groups(self): - self._groups() + @test_parallel(num_threads=threads) + def parallel(): + getattr(df.groupby('key')['data'], method)() + self.parallel = parallel - def time_groups_4(self): - self._pg4_groups() + def loop(): + getattr(df.groupby('key')['data'], method)() + self.loop = loop - @test_parallel(num_threads=8) - def _pg8_groups(self): - self._groups() + def time_parallel(self, threads, method): + self.parallel() - def time_groups_8(self): - self._pg8_groups() + def time_loop(self, threads, method): + for i in range(threads): + self.loop() +class ParallelGroups(object): -class nogil_take1d_float64(object): - goal_time = 0.2 + params = [2, 4, 8] + param_names = ['threads'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, threads): + if not have_real_test_parallel: raise NotImplementedError - self.N = 10000000.0 - self.df = DataFrame({'int64': np.arange(self.N, dtype='int64'), 'float64': np.arange(self.N, dtype='float64'), }) - self.indexer = np.arange(100, (len(self.df) - 100)) + size = 2**22 + ngroups = 10**3 + data = Series(np.random.randint(0, ngroups, size=size)) - def time_nogil_take1d_float64(self): - self.take_1d_pg2_int64() + 
@test_parallel(num_threads=threads) + def get_groups(): + data.groupby(data).groups + self.get_groups = get_groups - @test_parallel(num_threads=2) - def take_1d_pg2_int64(self): - com.take_1d(self.df.int64.values, self.indexer) + def time_get_groups(self, threads): + self.get_groups() - @test_parallel(num_threads=2) - def take_1d_pg2_float64(self): - com.take_1d(self.df.float64.values, self.indexer) +class ParallelTake1D(object): -class nogil_take1d_int64(object): - goal_time = 0.2 + params = ['int64', 'float64'] + param_names = ['dtype'] - def setup(self): - self.N = 1000000 - self.ngroups = 1000 - np.random.seed(1234) - self.df = DataFrame({'key': np.random.randint(0, self.ngroups, size=self.N), 'data': np.random.randn(self.N), }) - if (not have_real_test_parallel): + def setup(self, dtype): + if not have_real_test_parallel: raise NotImplementedError - self.N = 10000000.0 - self.df = DataFrame({'int64': np.arange(self.N, dtype='int64'), 'float64': np.arange(self.N, dtype='float64'), }) - self.indexer = np.arange(100, (len(self.df) - 100)) + N = 10**6 + df = DataFrame({'col': np.arange(N, dtype=dtype)}) + indexer = np.arange(100, len(df) - 100) - def time_nogil_take1d_int64(self): - self.take_1d_pg2_float64() + @test_parallel(num_threads=2) + def parallel_take1d(): + take_1d(df['col'].values, indexer) + self.parallel_take1d = parallel_take1d - @test_parallel(num_threads=2) - def take_1d_pg2_int64(self): - com.take_1d(self.df.int64.values, self.indexer) + def time_take1d(self, dtype): + self.parallel_take1d() - @test_parallel(num_threads=2) - def take_1d_pg2_float64(self): - com.take_1d(self.df.float64.values, self.indexer) +class ParallelKth(object): -class nogil_kth_smallest(object): number = 1 repeat = 5 def setup(self): - if (not have_real_test_parallel): + if not have_real_test_parallel: raise NotImplementedError - np.random.seed(1234) - self.N = 10000000 - self.k = 500000 - self.a = np.random.randn(self.N) - self.b = self.a.copy() - self.kwargs_list = [{'arr': self.a}, {'arr': self.b}] + N = 10**7 + k = 5 * 10**5 + kwargs_list = [{'arr': np.random.randn(N)}, + {'arr': np.random.randn(N)}] - def time_nogil_kth_smallest(self): - @test_parallel(num_threads=2, kwargs_list=self.kwargs_list) - def run(arr): - algos.kth_smallest(arr, self.k) - run() + @test_parallel(num_threads=2, kwargs_list=kwargs_list) + def parallel_kth_smallest(arr): + algos.kth_smallest(arr, k) + self.parallel_kth_smallest = parallel_kth_smallest + def time_kth_smallest(self): + self.parallel_kth_smallest() -class nogil_datetime_fields(object): - goal_time = 0.2 + +class ParallelDatetimeFields(object): def setup(self): - self.N = 100000000 - self.dti = pd.date_range('1900-01-01', periods=self.N, freq='D') - self.period = self.dti.to_period('D') - if (not have_real_test_parallel): + if not have_real_test_parallel: raise NotImplementedError + N = 10**6 + self.dti = date_range('1900-01-01', periods=N, freq='T') + self.period = self.dti.to_period('D') def time_datetime_field_year(self): @test_parallel(num_threads=2) @@ -268,149 +167,106 @@ def run(period): run(self.period) -class nogil_rolling_algos_slow(object): - goal_time = 0.2 - - def setup(self): - self.win = 100 - np.random.seed(1234) - self.arr = np.random.rand(100000) - if (not have_real_test_parallel): - raise NotImplementedError - - def time_nogil_rolling_median(self): - @test_parallel(num_threads=2) - def run(arr, win): - rolling_median(arr, win) - run(self.arr, self.win) - +class ParallelRolling(object): -class nogil_rolling_algos_fast(object): - goal_time = 
0.2 +    params = ['median', 'mean', 'min', 'max', 'var', 'skew', 'kurt', 'std'] +    param_names = ['method'] -    def setup(self): -        self.win = 100 -        np.random.seed(1234) -        self.arr = np.random.rand(1000000) -        if (not have_real_test_parallel): +    def setup(self, method): +        if not have_real_test_parallel: +            raise NotImplementedError +        win = 100 +        arr = np.random.rand(100000) +        if hasattr(DataFrame, 'rolling'): +            df = DataFrame(arr).rolling(win) + +            @test_parallel(num_threads=2) +            def parallel_rolling(): +                getattr(df, method)() +            self.parallel_rolling = parallel_rolling +        elif have_rolling_methods: +            rolling = {'median': rolling_median, +                       'mean': rolling_mean, +                       'min': rolling_min, +                       'max': rolling_max, +                       'var': rolling_var, +                       'skew': rolling_skew, +                       'kurt': rolling_kurt, +                       'std': rolling_std} + +            @test_parallel(num_threads=2) +            def parallel_rolling(): +                rolling[method](arr, win) +            self.parallel_rolling = parallel_rolling +        else: raise NotImplementedError -    def time_nogil_rolling_mean(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_mean(arr, win) -        run(self.arr, self.win) - -    def time_nogil_rolling_min(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_min(arr, win) -        run(self.arr, self.win) - -    def time_nogil_rolling_max(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_max(arr, win) -        run(self.arr, self.win) - -    def time_nogil_rolling_var(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_var(arr, win) -        run(self.arr, self.win) - -    def time_nogil_rolling_skew(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_skew(arr, win) -        run(self.arr, self.win) - -    def time_nogil_rolling_kurt(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_kurt(arr, win) -        run(self.arr, self.win) +    def time_rolling(self, method): +        self.parallel_rolling() -    def time_nogil_rolling_std(self): -        @test_parallel(num_threads=2) -        def run(arr, win): -            rolling_std(arr, win) -        run(self.arr, self.win) +class ParallelReadCSV(BaseIO): -class nogil_read_csv(object): number = 1 repeat = 5 +    params = ['float', 'object', 'datetime'] +    param_names = ['dtype'] -    def setup(self): -        if (not have_real_test_parallel): +    def setup(self, dtype): +        if not have_real_test_parallel: raise NotImplementedError -        # Using the values -        self.df = DataFrame(np.random.randn(10000, 50)) -        self.df.to_csv('__test__.csv') +        rows = 10000 +        cols = 50 +        data = {'float': DataFrame(np.random.randn(rows, cols)), +                'datetime': DataFrame(np.random.randn(rows, cols), +                                      index=date_range('1/1/2000', +                                                       periods=rows)), +                'object': DataFrame('foo', +                                    index=range(rows), +                                    columns=['object{:03d}'.format(i) +                                             for i in range(5)])} + +        self.fname = '__test_{}__.csv'.format(dtype) +        df = data[dtype] +        df.to_csv(self.fname) -        self.rng = date_range('1/1/2000', periods=10000) -        self.df_date_time = DataFrame(np.random.randn(10000, 50), index=self.rng) -        self.df_date_time.to_csv('__test_datetime__.csv') - -        self.df_object = DataFrame('foo', index=self.df.index, columns=self.create_cols('object')) -        self.df_object.to_csv('__test_object__.csv') - -    def create_cols(self, name): -        return [('%s%03d' % (name, i)) for i in range(5)] - -    @test_parallel(num_threads=2) -    def pg_read_csv(self): -        read_csv('__test__.csv', sep=',', header=None, float_precision=None) - -    def time_read_csv(self): -        self.pg_read_csv() - -    @test_parallel(num_threads=2) -    def pg_read_csv_object(self): -        read_csv('__test_object__.csv', sep=',') - -    def time_read_csv_object(self): -        self.pg_read_csv_object()
+ @test_parallel(num_threads=2) + def parallel_read_csv(): + read_csv(self.fname) + self.parallel_read_csv = parallel_read_csv - @test_parallel(num_threads=2) - def pg_read_csv_datetime(self): - read_csv('__test_datetime__.csv', sep=',', header=None) + def time_read_csv(self, dtype): + self.parallel_read_csv() - def time_read_csv_datetime(self): - self.pg_read_csv_datetime() +class ParallelFactorize(object): -class nogil_factorize(object): number = 1 repeat = 5 + params = [2, 4, 8] + param_names = ['threads'] - def setup(self): - if (not have_real_test_parallel): + def setup(self, threads): + if not have_real_test_parallel: raise NotImplementedError - np.random.seed(1234) - self.strings = tm.makeStringIndex(100000) + strings = tm.makeStringIndex(100000) - def factorize_strings(self): - pd.factorize(self.strings) + @test_parallel(num_threads=threads) + def parallel(): + factorize(strings) + self.parallel = parallel - @test_parallel(num_threads=4) - def _pg_factorize_strings_4(self): - self.factorize_strings() + def loop(): + factorize(strings) + self.loop = loop - def time_factorize_strings_4(self): - for i in range(2): - self._pg_factorize_strings_4() + def time_parallel(self, threads): + self.parallel() - @test_parallel(num_threads=2) - def _pg_factorize_strings_2(self): - self.factorize_strings() + def time_loop(self, threads): + for i in range(threads): + self.loop() - def time_factorize_strings_2(self): - for i in range(4): - self._pg_factorize_strings_2() - def time_factorize_strings(self): - for i in range(8): - self.factorize_strings() +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/groupby.py b/asv_bench/benchmarks/groupby.py index b8d8e8b7912d7..27d279bb90a31 100644 --- a/asv_bench/benchmarks/groupby.py +++ b/asv_bench/benchmarks/groupby.py @@ -1,129 +1,54 @@ -from .pandas_vb_common import * -from string import ascii_letters, digits +from functools import partial from itertools import product +from string import ascii_letters +import warnings +import numpy as np -class groupby_agg_builtins(object): - goal_time = 0.2 +from pandas import ( + Categorical, DataFrame, MultiIndex, Series, TimeGrouper, Timestamp, + date_range, period_range) +import pandas.util.testing as tm - def setup(self): - np.random.seed(27182) - self.n = 100000 - self.df = DataFrame(np.random.randint(1, (self.n / 100), (self.n, 3)), columns=['jim', 'joe', 'jolie']) - - def time_groupby_agg_builtins1(self): - self.df.groupby('jim').agg([sum, min, max]) - - def time_groupby_agg_builtins2(self): - self.df.groupby(['jim', 'joe']).agg([sum, min, max]) -#---------------------------------------------------------------------- -# dict return values +method_blacklist = { + 'object': {'median', 'prod', 'sem', 'cumsum', 'sum', 'cummin', 'mean', + 'max', 'skew', 'cumprod', 'cummax', 'rank', 'pct_change', 'min', + 'var', 'mad', 'describe', 'std', 'quantile'}, + 'datetime': {'median', 'prod', 'sem', 'cumsum', 'sum', 'mean', 'skew', + 'cumprod', 'cummax', 'pct_change', 'var', 'mad', 'describe', + 'std'} +} -class groupby_apply_dict_return(object): - goal_time = 0.2 +class ApplyDictReturn(object): def setup(self): self.labels = np.arange(1000).repeat(10) - self.data = Series(randn(len(self.labels))) - self.f = (lambda x: {'first': x.values[0], 'last': x.values[(-1)], }) + self.data = Series(np.random.randn(len(self.labels))) def time_groupby_apply_dict_return(self): - self.data.groupby(self.labels).apply(self.f) - - -#---------------------------------------------------------------------- -# 
groups - -class Groups(object): - goal_time = 0.1 - - size = 2 ** 22 - data = { - 'int64_small': Series(np.random.randint(0, 100, size=size)), - 'int64_large' : Series(np.random.randint(0, 10000, size=size)), - 'object_small': Series(tm.makeStringIndex(100).take(np.random.randint(0, 100, size=size))), - 'object_large': Series(tm.makeStringIndex(10000).take(np.random.randint(0, 10000, size=size))) - } - - param_names = ['df'] - params = ['int64_small', 'int64_large', 'object_small', 'object_large'] - - def setup(self, df): - self.df = self.data[df] - - def time_groupby_groups(self, df): - self.df.groupby(self.df).groups - - -#---------------------------------------------------------------------- -# First / last functions - -class FirstLast(object): - goal_time = 0.2 - - param_names = ['dtype'] - params = ['float32', 'float64', 'datetime', 'object'] - - # with datetimes (GH7555) + self.data.groupby(self.labels).apply(lambda x: {'first': x.values[0], + 'last': x.values[-1]}) - def setup(self, dtype): - - if dtype == 'datetime': - self.df = DataFrame( - {'values': date_range('1/1/2011', periods=100000, freq='s'), - 'key': range(100000),}) - elif dtype == 'object': - self.df = DataFrame( - {'values': (['foo'] * 100000), - 'key': range(100000)}) - else: - labels = np.arange(10000).repeat(10) - data = Series(randn(len(labels)), dtype=dtype) - data[::3] = np.nan - data[1::3] = np.nan - labels = labels.take(np.random.permutation(len(labels))) - self.df = DataFrame({'values': data, 'key': labels}) - def time_groupby_first(self, dtype): - self.df.groupby('key').first() - - def time_groupby_last(self, dtype): - self.df.groupby('key').last() - - def time_groupby_nth_any(self, dtype): - self.df.groupby('key').nth(0, dropna='all') - - def time_groupby_nth_none(self, dtype): - self.df.groupby('key').nth(0) +class Apply(object): + def setup_cache(self): + N = 10**4 + labels = np.random.randint(0, 2000, size=N) + labels2 = np.random.randint(0, 3, size=N) + df = DataFrame({'key': labels, + 'key2': labels2, + 'value1': np.random.randn(N), + 'value2': ['foo', 'bar', 'baz', 'qux'] * (N // 4) + }) + return df -#---------------------------------------------------------------------- -# DataFrame Apply overhead + def time_scalar_function_multi_col(self, df): + df.groupby(['key', 'key2']).apply(lambda x: 1) -class groupby_frame_apply(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.labels = np.random.randint(0, 2000, size=self.N) - self.labels2 = np.random.randint(0, 3, size=self.N) - self.df = DataFrame({ - 'key': self.labels, - 'key2': self.labels2, - 'value1': np.random.randn(self.N), - 'value2': (['foo', 'bar', 'baz', 'qux'] * (self.N // 4)), - }) - - @staticmethod - def scalar_function(g): - return 1 - - def time_groupby_frame_apply_scalar_function(self): - self.df.groupby(['key', 'key2']).apply(self.scalar_function) - - def time_groupby_frame_apply_scalar_function_overhead(self): - self.df.groupby('key').apply(self.scalar_function) + def time_scalar_function_single_col(self, df): + df.groupby('key').apply(lambda x: 1) @staticmethod def df_copy_function(g): @@ -131,374 +56,329 @@ def df_copy_function(g): g.name return g.copy() - def time_groupby_frame_df_copy_function(self): - self.df.groupby(['key', 'key2']).apply(self.df_copy_function) - - def time_groupby_frame_apply_df_copy_overhead(self): - self.df.groupby('key').apply(self.df_copy_function) - - -#---------------------------------------------------------------------- -# 2d grouping, aggregate many columns + def 
time_copy_function_multi_col(self, df): + df.groupby(['key', 'key2']).apply(self.df_copy_function) -class groupby_frame_cython_many_columns(object): - goal_time = 0.2 - - def setup(self): - self.labels = np.random.randint(0, 100, size=1000) - self.df = DataFrame(randn(1000, 1000)) - - def time_sum(self): - self.df.groupby(self.labels).sum() + def time_copy_overhead_single_col(self, df): + df.groupby('key').apply(self.df_copy_function) -#---------------------------------------------------------------------- -# single key, long, integer key - -class groupby_frame_singlekey_integer(object): - goal_time = 0.2 - - def setup(self): - self.data = np.random.randn(100000, 1) - self.labels = np.random.randint(0, 1000, size=100000) - self.df = DataFrame(self.data) - - def time_sum(self): - self.df.groupby(self.labels).sum() - - -#---------------------------------------------------------------------- -# DataFrame nth - -class groupby_nth(object): - goal_time = 0.2 +class Groups(object): - def setup(self): - self.df = DataFrame(np.random.randint(1, 100, (10000, 2))) + param_names = ['key'] + params = ['int64_small', 'int64_large', 'object_small', 'object_large'] - def time_groupby_frame_nth_any(self): - self.df.groupby(0).nth(0, dropna='any') + def setup_cache(self): + size = 10**6 + data = {'int64_small': Series(np.random.randint(0, 100, size=size)), + 'int64_large': Series(np.random.randint(0, 10000, size=size)), + 'object_small': Series( + tm.makeStringIndex(100).take( + np.random.randint(0, 100, size=size))), + 'object_large': Series( + tm.makeStringIndex(10000).take( + np.random.randint(0, 10000, size=size)))} + return data - def time_groupby_frame_nth_none(self): - self.df.groupby(0).nth(0) + def setup(self, data, key): + self.ser = data[key] - def time_groupby_series_nth_any(self): - self.df[1].groupby(self.df[0]).nth(0, dropna='any') + def time_series_groups(self, data, key): + self.ser.groupby(self.ser).groups - def time_groupby_series_nth_none(self): - self.df[1].groupby(self.df[0]).nth(0) +class GroupManyLabels(object): -#---------------------------------------------------------------------- -# groupby_indices replacement, chop up Series + params = [1, 1000] + param_names = ['ncols'] -class groupby_indices(object): - goal_time = 0.2 + def setup(self, ncols): + N = 1000 + data = np.random.randn(N, ncols) + self.labels = np.random.randint(0, 100, size=N) + self.df = DataFrame(data) - def setup(self): - try: - self.rng = date_range('1/1/2000', '12/31/2005', freq='H') - (self.year, self.month, self.day) = (self.rng.year, self.rng.month, self.rng.day) - except: - self.rng = date_range('1/1/2000', '12/31/2000', offset=datetools.Hour()) - self.year = self.rng.map((lambda x: x.year)) - self.month = self.rng.map((lambda x: x.month)) - self.day = self.rng.map((lambda x: x.day)) - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - - def time_groupby_indices(self): - len(self.ts.groupby([self.year, self.month, self.day])) + def time_sum(self, ncols): + self.df.groupby(self.labels).sum() -class groupby_int64_overflow(object): - goal_time = 0.2 +class Nth(object): - def setup(self): - self.arr = np.random.randint(((-1) << 12), (1 << 12), ((1 << 17), 5)) - self.i = np.random.choice(len(self.arr), (len(self.arr) * 5)) - self.arr = np.vstack((self.arr, self.arr[self.i])) - self.i = np.random.permutation(len(self.arr)) - self.arr = self.arr[self.i] - self.df = DataFrame(self.arr, columns=list('abcde')) - (self.df['jim'], self.df['joe']) = (np.random.randn(2, len(self.df)) * 10) + param_names = 
['dtype'] + params = ['float32', 'float64', 'datetime', 'object'] - def time_groupby_int64_overflow(self): - self.df.groupby(list('abcde')).max() + def setup(self, dtype): + N = 10**5 + # with datetimes (GH7555) + if dtype == 'datetime': + values = date_range('1/1/2011', periods=N, freq='s') + elif dtype == 'object': + values = ['foo'] * N + else: + values = np.arange(N).astype(dtype) + key = np.arange(N) + self.df = DataFrame({'key': key, 'values': values}) + self.df.iloc[1, 1] = np.nan # insert missing data -#---------------------------------------------------------------------- -# count() speed + def time_frame_nth_any(self, dtype): + self.df.groupby('key').nth(0, dropna='any') -class groupby_multi_count(object): - goal_time = 0.2 + def time_groupby_nth_all(self, dtype): + self.df.groupby('key').nth(0, dropna='all') - def setup(self): - self.n = 10000 - self.offsets = np.random.randint(self.n, size=self.n).astype('timedelta64[ns]') - self.dates = (np.datetime64('now') + self.offsets) - self.dates[(np.random.rand(self.n) > 0.5)] = np.datetime64('nat') - self.offsets[(np.random.rand(self.n) > 0.5)] = np.timedelta64('nat') - self.value2 = np.random.randn(self.n) - self.value2[(np.random.rand(self.n) > 0.5)] = np.nan - self.obj = np.random.choice(list('ab'), size=self.n).astype(object) - self.obj[(np.random.randn(self.n) > 0.5)] = np.nan - self.df = DataFrame({'key1': np.random.randint(0, 500, size=self.n), - 'key2': np.random.randint(0, 100, size=self.n), - 'dates': self.dates, - 'value2': self.value2, - 'value3': np.random.randn(self.n), - 'ints': np.random.randint(0, 1000, size=self.n), - 'obj': self.obj, - 'offsets': self.offsets, }) - - def time_groupby_multi_count(self): - self.df.groupby(['key1', 'key2']).count() - - -class groupby_int_count(object): - goal_time = 0.2 + def time_frame_nth(self, dtype): + self.df.groupby('key').nth(0) - def setup(self): - self.n = 10000 - self.df = DataFrame({'key1': randint(0, 500, size=self.n), - 'key2': randint(0, 100, size=self.n), - 'ints': randint(0, 1000, size=self.n), - 'ints2': randint(0, 1000, size=self.n), }) + def time_series_nth_any(self, dtype): + self.df['values'].groupby(self.df['key']).nth(0, dropna='any') - def time_groupby_int_count(self): - self.df.groupby(['key1', 'key2']).count() + def time_series_nth_all(self, dtype): + self.df['values'].groupby(self.df['key']).nth(0, dropna='all') + def time_series_nth(self, dtype): + self.df['values'].groupby(self.df['key']).nth(0) -#---------------------------------------------------------------------- -# nunique() speed -class groupby_nunique(object): +class DateAttributes(object): def setup(self): - self.n = 10000 - self.df = DataFrame({'key1': randint(0, 500, size=self.n), - 'key2': randint(0, 100, size=self.n), - 'ints': randint(0, 1000, size=self.n), - 'ints2': randint(0, 1000, size=self.n), }) - - def time_groupby_nunique(self): - self.df.groupby(['key1', 'key2']).nunique() + rng = date_range('1/1/2000', '12/31/2005', freq='H') + self.year, self.month, self.day = rng.year, rng.month, rng.day + self.ts = Series(np.random.randn(len(rng)), index=rng) + def time_len_groupby_object(self): + len(self.ts.groupby([self.year, self.month, self.day])) -#---------------------------------------------------------------------- -# group with different functions per column -class groupby_agg_multi(object): - goal_time = 0.2 +class Int64(object): def setup(self): - self.fac1 = np.array(['A', 'B', 'C'], dtype='O') - self.fac2 = np.array(['one', 'two'], dtype='O') - self.df = DataFrame({'key1': 
self.fac1.take(np.random.randint(0, 3, size=100000)), 'key2': self.fac2.take(np.random.randint(0, 2, size=100000)), 'value1': np.random.randn(100000), 'value2': np.random.randn(100000), 'value3': np.random.randn(100000), }) - - def time_groupby_multi_different_functions(self): - self.df.groupby(['key1', 'key2']).agg({'value1': 'mean', 'value2': 'var', 'value3': 'sum'}) - - def time_groupby_multi_different_numpy_functions(self): - self.df.groupby(['key1', 'key2']).agg({'value1': np.mean, 'value2': np.var, 'value3': np.sum}) - - -class groupby_multi_index(object): - goal_time = 0.2 + arr = np.random.randint(-1 << 12, 1 << 12, (1 << 17, 5)) + i = np.random.choice(len(arr), len(arr) * 5) + arr = np.vstack((arr, arr[i])) + i = np.random.permutation(len(arr)) + arr = arr[i] + self.cols = list('abcde') + self.df = DataFrame(arr, columns=self.cols) + self.df['jim'], self.df['joe'] = np.random.randn(2, len(self.df)) * 10 + + def time_overflow(self): + self.df.groupby(self.cols).max() + + +class CountMultiDtype(object): + + def setup_cache(self): + n = 10000 + offsets = np.random.randint(n, size=n).astype('timedelta64[ns]') + dates = np.datetime64('now') + offsets + dates[np.random.rand(n) > 0.5] = np.datetime64('nat') + offsets[np.random.rand(n) > 0.5] = np.timedelta64('nat') + value2 = np.random.randn(n) + value2[np.random.rand(n) > 0.5] = np.nan + obj = np.random.choice(list('ab'), size=n).astype(object) + obj[np.random.randn(n) > 0.5] = np.nan + df = DataFrame({'key1': np.random.randint(0, 500, size=n), + 'key2': np.random.randint(0, 100, size=n), + 'dates': dates, + 'value2': value2, + 'value3': np.random.randn(n), + 'ints': np.random.randint(0, 1000, size=n), + 'obj': obj, + 'offsets': offsets}) + return df + + def time_multi_count(self, df): + df.groupby(['key1', 'key2']).count() + + +class CountMultiInt(object): + + def setup_cache(self): + n = 10000 + df = DataFrame({'key1': np.random.randint(0, 500, size=n), + 'key2': np.random.randint(0, 100, size=n), + 'ints': np.random.randint(0, 1000, size=n), + 'ints2': np.random.randint(0, 1000, size=n)}) + return df + + def time_multi_int_count(self, df): + df.groupby(['key1', 'key2']).count() + + def time_multi_int_nunique(self, df): + df.groupby(['key1', 'key2']).nunique() + + +class AggFunctions(object): + + def setup_cache(self): + N = 10**5 + fac1 = np.array(['A', 'B', 'C'], dtype='O') + fac2 = np.array(['one', 'two'], dtype='O') + df = DataFrame({'key1': fac1.take(np.random.randint(0, 3, size=N)), + 'key2': fac2.take(np.random.randint(0, 2, size=N)), + 'value1': np.random.randn(N), + 'value2': np.random.randn(N), + 'value3': np.random.randn(N)}) + return df + + def time_different_str_functions(self, df): + df.groupby(['key1', 'key2']).agg({'value1': 'mean', + 'value2': 'var', + 'value3': 'sum'}) + + def time_different_numpy_functions(self, df): + df.groupby(['key1', 'key2']).agg({'value1': np.mean, + 'value2': np.var, + 'value3': np.sum}) + + def time_different_python_functions_multicol(self, df): + df.groupby(['key1', 'key2']).agg([sum, min, max]) + + def time_different_python_functions_singlecol(self, df): + df.groupby('key1').agg([sum, min, max]) + + +class GroupStrings(object): def setup(self): - self.n = (((5 * 7) * 11) * (1 << 9)) - self.alpha = list(map(''.join, product((ascii_letters + digits), repeat=4))) - self.f = (lambda k: np.repeat(np.random.choice(self.alpha, (self.n // k)), k)) - self.df = DataFrame({'a': self.f(11), 'b': self.f(7), 'c': self.f(5), 'd': self.f(1), }) + n = 2 * 10**5 + alpha = list(map(''.join, 
product(ascii_letters, repeat=4))) + data = np.random.choice(alpha, (n // 5, 4), replace=False) + data = np.repeat(data, 5, axis=0) + self.df = DataFrame(data, columns=list('abcd')) self.df['joe'] = (np.random.randn(len(self.df)) * 10).round(3) - self.i = np.random.permutation(len(self.df)) - self.df = self.df.iloc[self.i].reset_index(drop=True).copy() + self.df = self.df.sample(frac=1).reset_index(drop=True) - def time_groupby_multi_index(self): + def time_multi_columns(self): self.df.groupby(list('abcd')).max() -class groupby_multi(object): - goal_time = 0.2 - - def setup(self): - self.N = 100000 - self.ngroups = 100 - self.df = DataFrame({'key1': self.get_test_data(ngroups=self.ngroups), 'key2': self.get_test_data(ngroups=self.ngroups), 'data1': np.random.randn(self.N), 'data2': np.random.randn(self.N), }) - self.simple_series = Series(np.random.randn(self.N)) - self.key1 = self.df['key1'] - - def get_test_data(self, ngroups=100, n=100000): - self.unique_groups = range(self.ngroups) - self.arr = np.asarray(np.tile(self.unique_groups, (n / self.ngroups)), dtype=object) - if (len(self.arr) < n): - self.arr = np.asarray((list(self.arr) + self.unique_groups[:(n - len(self.arr))]), dtype=object) - random.shuffle(self.arr) - return self.arr - - def f(self): - self.df.groupby(['key1', 'key2']).agg((lambda x: x.values.sum())) +class MultiColumn(object): - def time_groupby_multi_cython(self): - self.df.groupby(['key1', 'key2']).sum() + def setup_cache(self): + N = 10**5 + key1 = np.tile(np.arange(100, dtype=object), 1000) + key2 = key1.copy() + np.random.shuffle(key1) + np.random.shuffle(key2) + df = DataFrame({'key1': key1, + 'key2': key2, + 'data1': np.random.randn(N), + 'data2': np.random.randn(N)}) + return df - def time_groupby_multi_python(self): - self.df.groupby(['key1', 'key2'])['data1'].agg((lambda x: x.values.sum())) + def time_lambda_sum(self, df): + df.groupby(['key1', 'key2']).agg(lambda x: x.values.sum()) - def time_groupby_multi_series_op(self): - self.df.groupby(['key1', 'key2'])['data1'].agg(np.std) + def time_cython_sum(self, df): + df.groupby(['key1', 'key2']).sum() - def time_groupby_series_simple_cython(self): - self.simple_series.groupby(self.key1).sum() + def time_col_select_lambda_sum(self, df): + df.groupby(['key1', 'key2'])['data1'].agg(lambda x: x.values.sum()) - def time_groupby_series_simple_rank(self): - self.df.groupby('key1').rank(pct=True) + def time_col_select_numpy_sum(self, df): + df.groupby(['key1', 'key2'])['data1'].agg(np.sum) -#---------------------------------------------------------------------- -# size() speed - -class groupby_size(object): - goal_time = 0.2 +class Size(object): def setup(self): - self.n = 100000 - self.offsets = np.random.randint(self.n, size=self.n).astype('timedelta64[ns]') - self.dates = (np.datetime64('now') + self.offsets) - self.df = DataFrame({'key1': np.random.randint(0, 500, size=self.n), 'key2': np.random.randint(0, 100, size=self.n), 'value1': np.random.randn(self.n), 'value2': np.random.randn(self.n), 'value3': np.random.randn(self.n), 'dates': self.dates, }) - - def time_groupby_multi_size(self): + n = 10**5 + offsets = np.random.randint(n, size=n).astype('timedelta64[ns]') + dates = np.datetime64('now') + offsets + self.df = DataFrame({'key1': np.random.randint(0, 500, size=n), + 'key2': np.random.randint(0, 100, size=n), + 'value1': np.random.randn(n), + 'value2': np.random.randn(n), + 'value3': np.random.randn(n), + 'dates': dates}) + self.draws = Series(np.random.randn(n)) + labels = Series(['foo', 'bar', 'baz', 
'qux'] * (n // 4)) + self.cats = labels.astype('category') + + def time_multi_size(self): self.df.groupby(['key1', 'key2']).size() - def time_groupby_dt_size(self): - self.df.groupby(['dates']).size() + def time_dt_timegrouper_size(self): + with warnings.catch_warnings(record=True): + self.df.groupby(TimeGrouper(key='dates', freq='M')).size() - def time_groupby_dt_timegrouper_size(self): - self.df.groupby(TimeGrouper(key='dates', freq='M')).size() + def time_category_size(self): + self.draws.groupby(self.cats).size() -#---------------------------------------------------------------------- -# groupby with a variable value for ngroups +class GroupByMethods(object): -class GroupBySuite(object): - goal_time = 0.2 + param_names = ['dtype', 'method', 'application'] + params = [['int', 'float', 'object', 'datetime'], + ['all', 'any', 'bfill', 'count', 'cumcount', 'cummax', 'cummin', + 'cumprod', 'cumsum', 'describe', 'ffill', 'first', 'head', + 'last', 'mad', 'max', 'min', 'median', 'mean', 'nunique', + 'pct_change', 'prod', 'quantile', 'rank', 'sem', 'shift', + 'size', 'skew', 'std', 'sum', 'tail', 'unique', 'value_counts', + 'var'], + ['direct', 'transformation']] - param_names = ['dtype', 'ngroups'] - params = [['int', 'float'], [100, 10000]] - - def setup(self, dtype, ngroups): - np.random.seed(1234) + def setup(self, dtype, method, application): + if method in method_blacklist.get(dtype, {}): + raise NotImplementedError # skip benchmark + ngroups = 1000 size = ngroups * 2 rng = np.arange(ngroups) values = rng.take(np.random.randint(0, ngroups, size=size)) if dtype == 'int': key = np.random.randint(0, size, size=size) - else: + elif dtype == 'float': key = np.concatenate([np.random.random(ngroups) * 0.1, np.random.random(ngroups) * 10.0]) + elif dtype == 'object': + key = ['foo'] * size + elif dtype == 'datetime': + key = date_range('1/1/2011', periods=size, freq='s') - self.df = DataFrame({'values': values, - 'key': key}) - - def time_all(self, dtype, ngroups): - self.df.groupby('key')['values'].all() - - def time_any(self, dtype, ngroups): - self.df.groupby('key')['values'].any() - - def time_count(self, dtype, ngroups): - self.df.groupby('key')['values'].count() - - def time_cumcount(self, dtype, ngroups): - self.df.groupby('key')['values'].cumcount() - - def time_cummax(self, dtype, ngroups): - self.df.groupby('key')['values'].cummax() - - def time_cummin(self, dtype, ngroups): - self.df.groupby('key')['values'].cummin() - - def time_cumprod(self, dtype, ngroups): - self.df.groupby('key')['values'].cumprod() - - def time_cumsum(self, dtype, ngroups): - self.df.groupby('key')['values'].cumsum() - - def time_describe(self, dtype, ngroups): - self.df.groupby('key')['values'].describe() - - def time_diff(self, dtype, ngroups): - self.df.groupby('key')['values'].diff() - - def time_first(self, dtype, ngroups): - self.df.groupby('key')['values'].first() - - def time_head(self, dtype, ngroups): - self.df.groupby('key')['values'].head() - - def time_last(self, dtype, ngroups): - self.df.groupby('key')['values'].last() - - def time_mad(self, dtype, ngroups): - self.df.groupby('key')['values'].mad() - - def time_max(self, dtype, ngroups): - self.df.groupby('key')['values'].max() - - def time_mean(self, dtype, ngroups): - self.df.groupby('key')['values'].mean() - - def time_median(self, dtype, ngroups): - self.df.groupby('key')['values'].median() - - def time_min(self, dtype, ngroups): - self.df.groupby('key')['values'].min() - - def time_nunique(self, dtype, ngroups): - 
self.df.groupby('key')['values'].nunique() - - def time_pct_change(self, dtype, ngroups): - self.df.groupby('key')['values'].pct_change() - - def time_prod(self, dtype, ngroups): - self.df.groupby('key')['values'].prod() - - def time_rank(self, dtype, ngroups): - self.df.groupby('key')['values'].rank() - - def time_sem(self, dtype, ngroups): - self.df.groupby('key')['values'].sem() + df = DataFrame({'values': values, 'key': key}) - def time_size(self, dtype, ngroups): - self.df.groupby('key')['values'].size() + if application == 'transform': + if method == 'describe': + raise NotImplementedError - def time_skew(self, dtype, ngroups): - self.df.groupby('key')['values'].skew() + self.as_group_method = lambda: df.groupby( + 'key')['values'].transform(method) + self.as_field_method = lambda: df.groupby( + 'values')['key'].transform(method) + else: + self.as_group_method = getattr(df.groupby('key')['values'], method) + self.as_field_method = getattr(df.groupby('values')['key'], method) - def time_std(self, dtype, ngroups): - self.df.groupby('key')['values'].std() + def time_dtype_as_group(self, dtype, method, application): + self.as_group_method() - def time_sum(self, dtype, ngroups): - self.df.groupby('key')['values'].sum() + def time_dtype_as_field(self, dtype, method, application): + self.as_field_method() - def time_tail(self, dtype, ngroups): - self.df.groupby('key')['values'].tail() - def time_unique(self, dtype, ngroups): - self.df.groupby('key')['values'].unique() +class RankWithTies(object): + # GH 21237 + param_names = ['dtype', 'tie_method'] + params = [['float64', 'float32', 'int64', 'datetime64'], + ['first', 'average', 'dense', 'min', 'max']] - def time_value_counts(self, dtype, ngroups): - self.df.groupby('key')['values'].value_counts() + def setup(self, dtype, tie_method): + N = 10**4 + if dtype == 'datetime64': + data = np.array([Timestamp("2011/01/01")] * N, dtype=dtype) + else: + data = np.array([1] * N, dtype=dtype) + self.df = DataFrame({'values': data, 'key': ['foo'] * N}) - def time_var(self, dtype, ngroups): - self.df.groupby('key')['values'].var() + def time_rank_ties(self, dtype, tie_method): + self.df.groupby('key').rank(method=tie_method) -class groupby_float32(object): +class Float32(object): # GH 13335 - goal_time = 0.2 - def setup(self): tmp1 = (np.random.random(10000) * 0.1).astype(np.float32) tmp2 = (np.random.random(10000) * 10.0).astype(np.float32) @@ -506,27 +386,26 @@ def setup(self): arr = np.repeat(tmp, 10) self.df = DataFrame(dict(a=arr, b=arr)) - def time_groupby_sum(self): + def time_sum(self): self.df.groupby(['a'])['b'].sum() -class groupby_categorical(object): - goal_time = 0.2 +class Categories(object): def setup(self): - N = 100000 + N = 10**5 arr = np.random.random(N) - - self.df = DataFrame(dict( - a=Categorical(np.random.randint(10000, size=N)), - b=arr)) - self.df_ordered = DataFrame(dict( - a=Categorical(np.random.randint(10000, size=N), ordered=True), - b=arr)) - self.df_extra_cat = DataFrame(dict( - a=Categorical(np.random.randint(100, size=N), - categories=np.arange(10000)), - b=arr)) + data = {'a': Categorical(np.random.randint(10000, size=N)), + 'b': arr} + self.df = DataFrame(data) + data = {'a': Categorical(np.random.randint(10000, size=N), + ordered=True), + 'b': arr} + self.df_ordered = DataFrame(data) + data = {'a': Categorical(np.random.randint(100, size=N), + categories=np.arange(10000)), + 'b': arr} + self.df_extra_cat = DataFrame(data) def time_groupby_sort(self): self.df.groupby('a')['b'].count() @@ -547,130 +426,64 @@ def 
time_groupby_extra_cat_nosort(self): self.df_extra_cat.groupby('a', sort=False)['b'].count() -class groupby_period(object): +class Datelike(object): # GH 14338 - goal_time = 0.2 - - def make_grouper(self, N): - return pd.period_range('1900-01-01', freq='D', periods=N) - - def setup(self): - N = 10000 - self.grouper = self.make_grouper(N) - self.df = pd.DataFrame(np.random.randn(N, 2)) - - def time_groupby_sum(self): + params = ['period_range', 'date_range', 'date_range_tz'] + param_names = ['grouper'] + + def setup(self, grouper): + N = 10**4 + rng_map = {'period_range': period_range, + 'date_range': date_range, + 'date_range_tz': partial(date_range, tz='US/Central')} + self.grouper = rng_map[grouper]('1900-01-01', freq='D', periods=N) + self.df = DataFrame(np.random.randn(10**4, 2)) + + def time_sum(self, grouper): self.df.groupby(self.grouper).sum() -class groupby_datetime(groupby_period): - def make_grouper(self, N): - return pd.date_range('1900-01-01', freq='D', periods=N) - - -class groupby_datetimetz(groupby_period): - def make_grouper(self, N): - return pd.date_range('1900-01-01', freq='D', periods=N, - tz='US/Central') - -#---------------------------------------------------------------------- -# Series.value_counts - -class series_value_counts(object): - goal_time = 0.2 - - def setup(self): - self.s = Series(np.random.randint(0, 1000, size=100000)) - self.s2 = self.s.astype(float) - - self.K = 1000 - self.N = 100000 - self.uniques = tm.makeStringIndex(self.K).values - self.s3 = Series(np.tile(self.uniques, (self.N // self.K))) - - def time_value_counts_int64(self): - self.s.value_counts() - - def time_value_counts_float64(self): - self.s2.value_counts() - - def time_value_counts_strings(self): - self.s.value_counts() - - -#---------------------------------------------------------------------- -# pivot_table - -class groupby_pivot_table(object): - goal_time = 0.2 - - def setup(self): - self.fac1 = np.array(['A', 'B', 'C'], dtype='O') - self.fac2 = np.array(['one', 'two'], dtype='O') - self.ind1 = np.random.randint(0, 3, size=100000) - self.ind2 = np.random.randint(0, 2, size=100000) - self.df = DataFrame({'key1': self.fac1.take(self.ind1), 'key2': self.fac2.take(self.ind2), 'key3': self.fac2.take(self.ind2), 'value1': np.random.randn(100000), 'value2': np.random.randn(100000), 'value3': np.random.randn(100000), }) - - def time_groupby_pivot_table(self): - self.df.pivot_table(index='key1', columns=['key2', 'key3']) - - -#---------------------------------------------------------------------- -# Sum booleans #2692 - -class groupby_sum_booleans(object): - goal_time = 0.2 - +class SumBools(object): + # GH 2692 def setup(self): - self.N = 500 - self.df = DataFrame({'ii': range(self.N), 'bb': [True for x in range(self.N)], }) + N = 500 + self.df = DataFrame({'ii': range(N), + 'bb': [True] * N}) def time_groupby_sum_booleans(self): self.df.groupby('ii').sum() -#---------------------------------------------------------------------- -# multi-indexed group sum #9049 - -class groupby_sum_multiindex(object): - goal_time = 0.2 +class SumMultiLevel(object): + # GH 9049 + timeout = 120.0 def setup(self): - self.N = 50 - self.df = DataFrame({'A': (list(range(self.N)) * 2), 'B': list(range((self.N * 2))), 'C': 1, }).set_index(['A', 'B']) + N = 50 + self.df = DataFrame({'A': list(range(N)) * 2, + 'B': range(N * 2), + 'C': 1}).set_index(['A', 'B']) def time_groupby_sum_multiindex(self): self.df.groupby(level=[0, 1]).sum() -#------------------------------------------------------------------------------- 
-# Transform testing - class Transform(object): - goal_time = 0.2 def setup(self): n1 = 400 n2 = 250 - - index = MultiIndex( - levels=[np.arange(n1), pd.util.testing.makeStringIndex(n2)], - labels=[[i for i in range(n1) for _ in range(n2)], - (list(range(n2)) * n1)], - names=['lev1', 'lev2']) - - data = DataFrame(np.random.randn(n1 * n2, 3), - index=index, columns=['col1', 'col20', 'col3']) - step = int((n1 * n2 * 0.1)) - for col in range(len(data.columns)): - idx = col - while (idx < len(data)): - data.set_value(data.index[idx], data.columns[col], np.nan) - idx += step + index = MultiIndex(levels=[np.arange(n1), tm.makeStringIndex(n2)], + codes=[np.repeat(range(n1), n2).tolist(), + list(range(n2)) * n1], + names=['lev1', 'lev2']) + arr = np.random.randn(n1 * n2, 3) + arr[::10000, 0] = np.nan + arr[1::10000, 1] = np.nan + arr[2::10000, 2] = np.nan + data = DataFrame(arr, index=index, columns=['col1', 'col20', 'col3']) self.df = data - self.f_fillna = (lambda x: x.fillna(method='pad')) - np.random.seed(2718281) n = 20000 self.df1 = DataFrame(np.random.randint(1, n, (n, 3)), columns=['jim', 'joe', 'jolie']) @@ -682,10 +495,10 @@ def setup(self): self.df4 = self.df3.copy() self.df4['jim'] = self.df4['joe'] - def time_transform_func(self): - self.df.groupby(level='lev2').transform(self.f_fillna) + def time_transform_lambda_max(self): + self.df.groupby(level='lev1').transform(lambda x: max(x)) - def time_transform_ufunc(self): + def time_transform_ufunc_max(self): self.df.groupby(level='lev1').transform(np.max) def time_transform_multi_key1(self): @@ -701,63 +514,30 @@ def time_transform_multi_key4(self): self.df4.groupby(['jim', 'joe'])['jolie'].transform('max') - - -np.random.seed(0) -N = 120000 -N_TRANSITIONS = 1400 -transition_points = np.random.permutation(np.arange(N))[:N_TRANSITIONS] -transition_points.sort() -transitions = np.zeros((N,), dtype=np.bool) -transitions[transition_points] = True -g = transitions.cumsum() -df = DataFrame({'signal': np.random.rand(N), }) - - - - - -class groupby_transform_series(object): - goal_time = 0.2 +class TransformBools(object): def setup(self): - np.random.seed(0) N = 120000 transition_points = np.sort(np.random.choice(np.arange(N), 1400)) - transitions = np.zeros((N,), dtype=np.bool) + transitions = np.zeros(N, dtype=np.bool) transitions[transition_points] = True self.g = transitions.cumsum() self.df = DataFrame({'signal': np.random.rand(N)}) - def time_groupby_transform_series(self): + def time_transform_mean(self): self.df['signal'].groupby(self.g).transform(np.mean) -class groupby_transform_series2(object): - goal_time = 0.2 - +class TransformNaN(object): + # GH 12737 def setup(self): - np.random.seed(0) - self.df = DataFrame({'key': (np.arange(100000) // 3), - 'val': np.random.randn(100000)}) - - self.df_nans = pd.DataFrame({'key': np.repeat(np.arange(1000), 10), - 'B': np.nan, - 'C': np.nan}) - self.df_nans.ix[4::10, 'B':'C'] = 5 + self.df_nans = DataFrame({'key': np.repeat(np.arange(1000), 10), + 'B': np.nan, + 'C': np.nan}) + self.df_nans.loc[4::10, 'B':'C'] = 5 - def time_transform_series2(self): - self.df.groupby('key')['val'].transform(np.mean) - - def time_cumprod(self): - self.df.groupby('key').cumprod() - - def time_cumsum(self): - self.df.groupby('key').cumsum() + def time_first(self): + self.df_nans.groupby('key').transform('first') - def time_shift(self): - self.df.groupby('key').shift() - def time_transform_dataframe(self): - # GH 12737 - self.df_nans.groupby('key').transform('first') +from .pandas_vb_common import setup # noqa: F401 
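The rewritten classes in the hunks above all follow the same asv conventions: `params` and `param_names` declare the benchmark matrix, `setup` and every `time_*` method receive one value per parameter, raising `NotImplementedError` inside `setup` skips that combination (the `have_real_test_parallel` idiom in gil.py), and `setup_cache` builds expensive data once. A minimal, self-contained sketch of the pattern; the class name and data below are illustrative only and are not part of the pandas benchmark suite:

import numpy as np
from pandas import DataFrame


class ExampleGroupBySum(object):
    # Every combination of ngroups x dtype is benchmarked separately.
    params = ([100, 10000], ['int64', 'float64', 'object'])
    param_names = ['ngroups', 'dtype']

    def setup(self, ngroups, dtype):
        if dtype == 'object':
            # asv treats NotImplementedError raised in setup() as
            # "skip this parameter combination"
            raise NotImplementedError
        N = 10**5
        keys = np.random.randint(0, ngroups, size=N)
        self.df = DataFrame({'key': keys, 'values': keys.astype(dtype)})

    def time_sum(self, ngroups, dtype):
        # the parameter values are passed to every time_* method too,
        # even when only setup() actually needs them
        self.df.groupby('key')['values'].sum()

Classes such as Apply, Groups and CountMultiDtype above use `setup_cache` instead of `setup` for data that is costly to build: asv evaluates it once and passes its return value as the leading argument to `setup` and to each `time_*` method, which is why those methods take a `df`/`data` parameter.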
diff --git a/asv_bench/benchmarks/hdfstore_bench.py b/asv_bench/benchmarks/hdfstore_bench.py deleted file mode 100644 index 78de5267a2969..0000000000000 --- a/asv_bench/benchmarks/hdfstore_bench.py +++ /dev/null @@ -1,122 +0,0 @@ -from .pandas_vb_common import * -import os - - -class HDF5(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(25000) - self.df = DataFrame({'float1': randn(25000), 'float2': randn(25000),}, - index=self.index) - - self.df_mixed = DataFrame( - {'float1': randn(25000), 'float2': randn(25000), - 'string1': (['foo'] * 25000), - 'bool1': ([True] * 25000), - 'int1': np.random.randint(0, 250000, size=25000),}, - index=self.index) - - self.df_wide = DataFrame(np.random.randn(25000, 100)) - - self.df2 = DataFrame({'float1': randn(25000), 'float2': randn(25000)}, - index=date_range('1/1/2000', periods=25000)) - self.df_wide2 = DataFrame(np.random.randn(25000, 100), - index=date_range('1/1/2000', periods=25000)) - - self.df_dc = DataFrame(np.random.randn(10000, 10), - columns=[('C%03d' % i) for i in range(10)]) - - self.f = '__test__.h5' - self.remove(self.f) - - self.store = HDFStore(self.f) - self.store.put('df1', self.df) - self.store.put('df_mixed', self.df_mixed) - - self.store.append('df5', self.df_mixed) - self.store.append('df7', self.df) - - self.store.append('df9', self.df_wide) - - self.store.append('df11', self.df_wide2) - self.store.append('df12', self.df2) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - def time_read_store(self): - self.store.get('df1') - - def time_read_store_mixed(self): - self.store.get('df_mixed') - - def time_write_store(self): - self.store.put('df2', self.df) - - def time_write_store_mixed(self): - self.store.put('df_mixed2', self.df_mixed) - - def time_read_store_table_mixed(self): - self.store.select('df5') - - def time_write_store_table_mixed(self): - self.store.append('df6', self.df_mixed) - - def time_read_store_table(self): - self.store.select('df7') - - def time_write_store_table(self): - self.store.append('df8', self.df) - - def time_read_store_table_wide(self): - self.store.select('df9') - - def time_write_store_table_wide(self): - self.store.append('df10', self.df_wide) - - def time_write_store_table_dc(self): - self.store.append('df15', self.df, data_columns=True) - - def time_query_store_table_wide(self): - self.store.select('df11', [('index', '>', self.df_wide2.index[10000]), - ('index', '<', self.df_wide2.index[15000])]) - - def time_query_store_table(self): - self.store.select('df12', [('index', '>', self.df2.index[10000]), - ('index', '<', self.df2.index[15000])]) - - -class HDF5Panel(object): - goal_time = 0.2 - - def setup(self): - self.f = '__test__.h5' - self.p = Panel(randn(20, 1000, 25), - items=[('Item%03d' % i) for i in range(20)], - major_axis=date_range('1/1/2000', periods=1000), - minor_axis=[('E%03d' % i) for i in range(25)]) - self.remove(self.f) - self.store = HDFStore(self.f) - self.store.append('p1', self.p) - - def teardown(self): - self.store.close() - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - - def time_read_store_table_panel(self): - self.store.select('p1') - - def time_write_store_table_panel(self): - self.store.append('p2', self.p) diff --git a/asv_bench/benchmarks/index_object.py b/asv_bench/benchmarks/index_object.py index 3fb53ce9b3c98..bbe164d4858ab 100644 --- a/asv_bench/benchmarks/index_object.py +++ b/asv_bench/benchmarks/index_object.py @@ -1,201 +1,184 @@ -from 
.pandas_vb_common import * +import numpy as np +import pandas.util.testing as tm +from pandas import (Series, date_range, DatetimeIndex, Index, RangeIndex, + Float64Index) class SetOperations(object): - goal_time = 0.2 - def setup(self): - self.rng = date_range('1/1/2000', periods=10000, freq='T') - self.rng2 = self.rng[:(-1)] + params = (['datetime', 'date_string', 'int', 'strings'], + ['intersection', 'union', 'symmetric_difference']) + param_names = ['dtype', 'method'] - # object index with datetime values - if (self.rng.dtype == object): - self.idx_rng = self.rng.view(Index) - else: - self.idx_rng = self.rng.asobject - self.idx_rng2 = self.idx_rng[:(-1)] + def setup(self, dtype, method): + N = 10**5 + dates_left = date_range('1/1/2000', periods=N, freq='T') + fmt = '%Y-%m-%d %H:%M:%S' + date_str_left = Index(dates_left.strftime(fmt)) + int_left = Index(np.arange(N)) + str_left = tm.makeStringIndex(N) + data = {'datetime': {'left': dates_left, 'right': dates_left[:-1]}, + 'date_string': {'left': date_str_left, + 'right': date_str_left[:-1]}, + 'int': {'left': int_left, 'right': int_left[:-1]}, + 'strings': {'left': str_left, 'right': str_left[:-1]}} + self.left = data[dtype]['left'] + self.right = data[dtype]['right'] - # other datetime - N = 100000 - A = N - 20000 - B = N + 20000 - self.dtidx1 = DatetimeIndex(range(N)) - self.dtidx2 = DatetimeIndex(range(A, B)) - self.dtidx3 = DatetimeIndex(range(N, B)) - - # integer - self.N = 1000000 - self.options = np.arange(self.N) - self.left = Index( - self.options.take(np.random.permutation(self.N)[:(self.N // 2)])) - self.right = Index( - self.options.take(np.random.permutation(self.N)[:(self.N // 2)])) - - # strings - N = 10000 - strs = tm.rands_array(10, N) - self.leftstr = Index(strs[:N * 2 // 3]) - self.rightstr = Index(strs[N // 3:]) + def time_operation(self, dtype, method): + getattr(self.left, method)(self.right) - def time_datetime_intersection(self): - self.rng.intersection(self.rng2) - def time_datetime_union(self): - self.rng.union(self.rng2) +class SetDisjoint(object): - def time_datetime_difference(self): - self.dtidx1.difference(self.dtidx2) + def setup(self): + N = 10**5 + B = N + 20000 + self.datetime_left = DatetimeIndex(range(N)) + self.datetime_right = DatetimeIndex(range(N, B)) def time_datetime_difference_disjoint(self): - self.dtidx1.difference(self.dtidx3) - - def time_datetime_symmetric_difference(self): - self.dtidx1.symmetric_difference(self.dtidx2) - - def time_index_datetime_intersection(self): - self.idx_rng.intersection(self.idx_rng2) - - def time_index_datetime_union(self): - self.idx_rng.union(self.idx_rng2) - - def time_int64_intersection(self): - self.left.intersection(self.right) - - def time_int64_union(self): - self.left.union(self.right) - - def time_int64_difference(self): - self.left.difference(self.right) - - def time_int64_symmetric_difference(self): - self.left.symmetric_difference(self.right) - - def time_str_difference(self): - self.leftstr.difference(self.rightstr) - - def time_str_symmetric_difference(self): - self.leftstr.symmetric_difference(self.rightstr) + self.datetime_left.difference(self.datetime_right) class Datetime(object): - goal_time = 0.2 def setup(self): - self.dr = pd.date_range('20000101', freq='D', periods=10000) + self.dr = date_range('20000101', freq='D', periods=10000) def time_is_dates_only(self): self.dr._is_dates_only -class Float64(object): - goal_time = 0.2 - - def setup(self): - self.idx = tm.makeFloatIndex(1000000) - self.mask = ((np.arange(self.idx.size) % 3) == 0) - 
self.series_mask = Series(self.mask) - - self.baseidx = np.arange(1000000.0) +class Ops(object): - def time_boolean_indexer(self): - self.idx[self.mask] + sample_time = 0.2 + params = ['float', 'int'] + param_names = ['dtype'] - def time_boolean_series_indexer(self): - self.idx[self.series_mask] + def setup(self, dtype): + N = 10**6 + indexes = {'int': 'makeIntIndex', 'float': 'makeFloatIndex'} + self.index = getattr(tm, indexes[dtype])(N) - def time_construct(self): - Index(self.baseidx) + def time_add(self, dtype): + self.index + 2 - def time_div(self): - (self.idx / 2) + def time_subtract(self, dtype): + self.index - 2 - def time_get(self): - self.idx[1] + def time_multiply(self, dtype): + self.index * 2 - def time_mul(self): - (self.idx * 2) + def time_divide(self, dtype): + self.index / 2 - def time_slice_indexer_basic(self): - self.idx[:(-1)] - - def time_slice_indexer_even(self): - self.idx[::2] + def time_modulo(self, dtype): + self.index % 2 -class StringIndex(object): - goal_time = 0.2 +class Range(object): def setup(self): - self.idx = tm.makeStringIndex(1000000) - self.mask = ((np.arange(1000000) % 3) == 0) - self.series_mask = Series(self.mask) + self.idx_inc = RangeIndex(start=0, stop=10**7, step=3) + self.idx_dec = RangeIndex(start=10**7, stop=-1, step=-3) - def time_boolean_indexer(self): - self.idx[self.mask] + def time_max(self): + self.idx_inc.max() - def time_boolean_series_indexer(self): - self.idx[self.series_mask] + def time_max_trivial(self): + self.idx_dec.max() - def time_slice_indexer_basic(self): - self.idx[:(-1)] + def time_min(self): + self.idx_dec.min() - def time_slice_indexer_even(self): - self.idx[::2] + def time_min_trivial(self): + self.idx_inc.min() -class Multi1(object): - goal_time = 0.2 +class IndexAppend(object): def setup(self): - (n, k) = (200, 5000) - self.levels = [np.arange(n), tm.makeStringIndex(n).values, (1000 + np.arange(n))] - self.labels = [np.random.choice(n, (k * n)) for lev in self.levels] - self.mi = MultiIndex(levels=self.levels, labels=self.labels) - - self.iterables = [tm.makeStringIndex(10000), range(20)] - - def time_duplicated(self): - self.mi.duplicated() - - def time_from_product(self): - MultiIndex.from_product(self.iterables) + N = 10000 + self.range_idx = RangeIndex(0, 100) + self.int_idx = self.range_idx.astype(int) + self.obj_idx = self.int_idx.astype(str) + self.range_idxs = [] + self.int_idxs = [] + self.object_idxs = [] + for i in range(1, N): + r_idx = RangeIndex(i * 100, (i + 1) * 100) + self.range_idxs.append(r_idx) + i_idx = r_idx.astype(int) + self.int_idxs.append(i_idx) + o_idx = i_idx.astype(str) + self.object_idxs.append(o_idx) + + def time_append_range_list(self): + self.range_idx.append(self.range_idxs) + + def time_append_int_list(self): + self.int_idx.append(self.int_idxs) + + def time_append_obj_list(self): + self.obj_idx.append(self.object_idxs) + + +class Indexing(object): + + params = ['String', 'Float', 'Int'] + param_names = ['dtype'] + + def setup(self, dtype): + N = 10**6 + self.idx = getattr(tm, 'make{}Index'.format(dtype))(N) + self.array_mask = (np.arange(N) % 3) == 0 + self.series_mask = Series(self.array_mask) + self.sorted = self.idx.sort_values() + half = N // 2 + self.non_unique = self.idx[:half].append(self.idx[:half]) + self.non_unique_sorted = (self.sorted[:half].append(self.sorted[:half]) + .sort_values()) + self.key = self.sorted[N // 4] + + def time_boolean_array(self, dtype): + self.idx[self.array_mask] + + def time_boolean_series(self, dtype): + self.idx[self.series_mask] -class 
Multi2(object): - goal_time = 0.2 + def time_get(self, dtype): + self.idx[1] - def setup(self): - self.n = ((((3 * 5) * 7) * 11) * (1 << 10)) - (low, high) = (((-1) << 12), (1 << 12)) - self.f = (lambda k: np.repeat(np.random.randint(low, high, (self.n // k)), k)) - self.i = np.random.permutation(self.n) - self.mi = MultiIndex.from_arrays([self.f(11), self.f(7), self.f(5), self.f(3), self.f(1)])[self.i] + def time_slice(self, dtype): + self.idx[:-1] - self.a = np.repeat(np.arange(100), 1000) - self.b = np.tile(np.arange(1000), 100) - self.midx2 = MultiIndex.from_arrays([self.a, self.b]) - self.midx2 = self.midx2.take(np.random.permutation(np.arange(100000))) + def time_slice_step(self, dtype): + self.idx[::2] - def time_sortlevel_int64(self): - self.mi.sortlevel() + def time_get_loc(self, dtype): + self.idx.get_loc(self.key) - def time_sortlevel_zero(self): - self.midx2.sortlevel(0) + def time_get_loc_sorted(self, dtype): + self.sorted.get_loc(self.key) - def time_sortlevel_one(self): - self.midx2.sortlevel(1) + def time_get_loc_non_unique(self, dtype): + self.non_unique.get_loc(self.key) + def time_get_loc_non_unique_sorted(self, dtype): + self.non_unique_sorted.get_loc(self.key) -class Multi3(object): - goal_time = 0.2 +class Float64IndexMethod(object): + # GH 13166 def setup(self): - self.level1 = range(1000) - self.level2 = date_range(start='1/1/2012', periods=100) - self.mi = MultiIndex.from_product([self.level1, self.level2]) + N = 100000 + a = np.arange(N) + self.ind = Float64Index(a * 4.8000000418824129e-08) + + def time_get_loc(self): + self.ind.get_loc(0) - def time_datetime_level_values_full(self): - self.mi.copy().values - def time_datetime_level_values_sliced(self): - self.mi[:10].values +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/indexing.py b/asv_bench/benchmarks/indexing.py index d938cc6a6dc4d..57ba9cd80e55c 100644 --- a/asv_bench/benchmarks/indexing.py +++ b/asv_bench/benchmarks/indexing.py @@ -1,237 +1,350 @@ -from .pandas_vb_common import * -try: - import pandas.computation.expressions as expr -except: - expr = None +import warnings +import numpy as np +import pandas.util.testing as tm +from pandas import (Series, DataFrame, Panel, MultiIndex, + Int64Index, UInt64Index, Float64Index, + IntervalIndex, CategoricalIndex, + IndexSlice, concat, date_range) -class Int64Indexing(object): - goal_time = 0.2 - def setup(self): - self.s = Series(np.random.rand(1000000)) - - def time_getitem_scalar(self): - self.s[800000] +class NumericSeriesIndexing(object): - def time_getitem_slice(self): - self.s[:800000] + params = [ + (Int64Index, UInt64Index, Float64Index), + ('unique_monotonic_inc', 'nonunique_monotonic_inc'), + ] + param_names = ['index_dtype', 'index_structure'] - def time_getitem_list_like(self): - self.s[[800000]] + def setup(self, index, index_structure): + N = 10**6 + indices = { + 'unique_monotonic_inc': index(range(N)), + 'nonunique_monotonic_inc': index( + list(range(55)) + [54] + list(range(55, N - 1))), + } + self.data = Series(np.random.rand(N), index=indices[index_structure]) + self.array = np.arange(10000) + self.array_list = self.array.tolist() - def time_getitem_array(self): - self.s[np.arange(10000)] + def time_getitem_scalar(self, index, index_structure): + self.data[800000] - def time_iloc_array(self): - self.s.iloc[np.arange(10000)] + def time_getitem_slice(self, index, index_structure): + self.data[:800000] - def time_iloc_list_like(self): - self.s.iloc[[800000]] + def time_getitem_list_like(self, index, 
index_structure): + self.data[[800000]] - def time_iloc_scalar(self): - self.s.iloc[800000] + def time_getitem_array(self, index, index_structure): + self.data[self.array] - def time_iloc_slice(self): - self.s.iloc[:800000] + def time_getitem_lists(self, index, index_structure): + self.data[self.array_list] - def time_ix_array(self): - self.s.ix[np.arange(10000)] + def time_iloc_array(self, index, index_structure): + self.data.iloc[self.array] - def time_ix_list_like(self): - self.s.ix[[800000]] + def time_iloc_list_like(self, index, index_structure): + self.data.iloc[[800000]] - def time_ix_scalar(self): - self.s.ix[800000] + def time_iloc_scalar(self, index, index_structure): + self.data.iloc[800000] - def time_ix_slice(self): - self.s.ix[:800000] + def time_iloc_slice(self, index, index_structure): + self.data.iloc[:800000] - def time_loc_array(self): - self.s.loc[np.arange(10000)] + def time_ix_array(self, index, index_structure): + self.data.ix[self.array] - def time_loc_list_like(self): - self.s.loc[[800000]] + def time_ix_list_like(self, index, index_structure): + self.data.ix[[800000]] - def time_loc_scalar(self): - self.s.loc[800000] + def time_ix_scalar(self, index, index_structure): + self.data.ix[800000] - def time_loc_slice(self): - self.s.loc[:800000] + def time_ix_slice(self, index, index_structure): + self.data.ix[:800000] + def time_loc_array(self, index, index_structure): + self.data.loc[self.array] -class StringIndexing(object): - goal_time = 0.2 + def time_loc_list_like(self, index, index_structure): + self.data.loc[[800000]] - def setup(self): - self.index = tm.makeStringIndex(1000000) - self.s = Series(np.random.rand(1000000), index=self.index) - self.lbl = self.s.index[800000] + def time_loc_scalar(self, index, index_structure): + self.data.loc[800000] - def time_getitem_label_slice(self): - self.s[:self.lbl] + def time_loc_slice(self, index, index_structure): + self.data.loc[:800000] - def time_getitem_pos_slice(self): - self.s[:800000] - def time_get_value(self): - self.s.get_value(self.lbl) +class NonNumericSeriesIndexing(object): + params = [ + ('string', 'datetime'), + ('unique_monotonic_inc', 'nonunique_monotonic_inc'), + ] + param_names = ['index_dtype', 'index_structure'] -class DatetimeIndexing(object): - goal_time = 0.2 + def setup(self, index, index_structure): + N = 10**6 + indexes = {'string': tm.makeStringIndex(N), + 'datetime': date_range('1900', periods=N, freq='s')} + index = indexes[index] + if index_structure == 'nonunique_monotonic_inc': + index = index.insert(item=index[2], loc=2)[:-1] + self.s = Series(np.random.rand(N), index=index) + self.lbl = index[80000] - def setup(self): - tm.N = 1000 - self.ts = tm.makeTimeSeries() - self.dt = self.ts.index[500] + def time_getitem_label_slice(self, index, index_structure): + self.s[:self.lbl] - def time_getitem_scalar(self): - self.ts[self.dt] + def time_getitem_pos_slice(self, index, index_structure): + self.s[:80000] + def time_get_value(self, index, index_structure): + with warnings.catch_warnings(record=True): + self.s.get_value(self.lbl) -class DataFrameIndexing(object): - goal_time = 0.2 + def time_getitem_scalar(self, index, index_structure): + self.s[self.lbl] - def setup(self): - self.index = tm.makeStringIndex(1000) - self.columns = tm.makeStringIndex(30) - self.df = DataFrame(np.random.randn(1000, 30), index=self.index, - columns=self.columns) - self.idx = self.index[100] - self.col = self.columns[10] + def time_getitem_list_like(self, index, index_structure): + self.s[[self.lbl]] - self.df2 = 
DataFrame(np.random.randn(10000, 4), - columns=['A', 'B', 'C', 'D']) - self.indexer = (self.df2['B'] > 0) - self.obj_indexer = self.indexer.astype('O') - # duptes - self.idx_dupe = (np.array(range(30)) * 99) - self.df3 = DataFrame({'A': ([0.1] * 1000), 'B': ([1] * 1000),}) - self.df3 = concat([self.df3, (2 * self.df3), (3 * self.df3)]) +class DataFrameStringIndexing(object): - self.df_big = DataFrame(dict(A=(['foo'] * 1000000))) + def setup(self): + index = tm.makeStringIndex(1000) + columns = tm.makeStringIndex(30) + self.df = DataFrame(np.random.randn(1000, 30), index=index, + columns=columns) + self.idx_scalar = index[100] + self.col_scalar = columns[10] + self.bool_indexer = self.df[self.col_scalar] > 0 + self.bool_obj_indexer = self.bool_indexer.astype(object) def time_get_value(self): - self.df.get_value(self.idx, self.col) + with warnings.catch_warnings(record=True): + self.df.get_value(self.idx_scalar, self.col_scalar) + + def time_ix(self): + self.df.ix[self.idx_scalar, self.col_scalar] - def time_get_value_ix(self): - self.df.ix[(self.idx, self.col)] + def time_loc(self): + self.df.loc[self.idx_scalar, self.col_scalar] def time_getitem_scalar(self): - self.df[self.col][self.idx] + self.df[self.col_scalar][self.idx_scalar] def time_boolean_rows(self): - self.df2[self.indexer] + self.df[self.bool_indexer] def time_boolean_rows_object(self): - self.df2[self.obj_indexer] + self.df[self.bool_obj_indexer] + + +class DataFrameNumericIndexing(object): + + def setup(self): + self.idx_dupe = np.array(range(30)) * 99 + self.df = DataFrame(np.random.randn(10000, 5)) + self.df_dup = concat([self.df, 2 * self.df, 3 * self.df]) + self.bool_indexer = [True] * 5000 + [False] * 5000 def time_iloc_dups(self): - self.df3.iloc[self.idx_dupe] + self.df_dup.iloc[self.idx_dupe] def time_loc_dups(self): - self.df3.loc[self.idx_dupe] + self.df_dup.loc[self.idx_dupe] - def time_iloc_big(self): - self.df_big.iloc[:100, 0] + def time_iloc(self): + self.df.iloc[:100, 0] + def time_loc(self): + self.df.loc[:100, 0] -class IndexingMethods(object): - # GH 13166 - goal_time = 0.2 + def time_bool_indexer(self): + self.df[self.bool_indexer] - def setup(self): - a = np.arange(100000) - self.ind = pd.Float64Index(a * 4.8000000418824129e-08) - self.s = Series(np.random.rand(100000)) - self.ts = Series(np.random.rand(100000), - index=date_range('2011-01-01', freq='S', periods=100000)) - self.indexer = ([True, False, True, True, False] * 20000) +class Take(object): - def time_get_loc_float(self): - self.ind.get_loc(0) + params = ['int', 'datetime'] + param_names = ['index'] - def time_take_dtindex(self): - self.ts.take(self.indexer) + def setup(self, index): + N = 100000 + indexes = {'int': Int64Index(np.arange(N)), + 'datetime': date_range('2011-01-01', freq='S', periods=N)} + index = indexes[index] + self.s = Series(np.random.rand(N), index=index) + self.indexer = [True, False, True, True, False] * 20000 - def time_take_intindex(self): + def time_take(self, index): self.s.take(self.indexer) class MultiIndexing(object): - goal_time = 0.2 def setup(self): - self.mi = MultiIndex.from_tuples([(x, y) for x in range(1000) for y in range(1000)]) - self.s = Series(np.random.randn(1000000), index=self.mi) + mi = MultiIndex.from_product([range(1000), range(1000)]) + self.s = Series(np.random.randn(1000000), index=mi) self.df = DataFrame(self.s) - # slicers - np.random.seed(1234) - self.idx = pd.IndexSlice - self.n = 100000 - self.mdt = pandas.DataFrame() - self.mdt['A'] = np.random.choice(range(10000, 45000, 1000), self.n) - 
self.mdt['B'] = np.random.choice(range(10, 400), self.n) - self.mdt['C'] = np.random.choice(range(1, 150), self.n) - self.mdt['D'] = np.random.choice(range(10000, 45000), self.n) - self.mdt['x'] = np.random.choice(range(400), self.n) - self.mdt['y'] = np.random.choice(range(25), self.n) - self.test_A = 25000 - self.test_B = 25 - self.test_C = 40 - self.test_D = 35000 - self.eps_A = 5000 - self.eps_B = 5 - self.eps_C = 5 - self.eps_D = 5000 - self.mdt2 = self.mdt.set_index(['A', 'B', 'C', 'D']).sortlevel() - self.miint = MultiIndex.from_product( - [np.arange(1000), - np.arange(1000)], names=['one', 'two']) - - import string - self.mistring = MultiIndex.from_product( - [np.arange(1000), - np.arange(20), list(string.ascii_letters)], - names=['one', 'two', 'three']) - - def time_series_xs_mi_ix(self): + n = 100000 + self.mdt = DataFrame({'A': np.random.choice(range(10000, 45000, 1000), + n), + 'B': np.random.choice(range(10, 400), n), + 'C': np.random.choice(range(1, 150), n), + 'D': np.random.choice(range(10000, 45000), n), + 'x': np.random.choice(range(400), n), + 'y': np.random.choice(range(25), n)}) + self.idx = IndexSlice[20000:30000, 20:30, 35:45, 30000:40000] + self.mdt = self.mdt.set_index(['A', 'B', 'C', 'D']).sort_index() + + def time_series_ix(self): self.s.ix[999] - def time_frame_xs_mi_ix(self): + def time_frame_ix(self): self.df.ix[999] - def time_multiindex_slicers(self): - self.mdt2.loc[self.idx[ - (self.test_A - self.eps_A):(self.test_A + self.eps_A), - (self.test_B - self.eps_B):(self.test_B + self.eps_B), - (self.test_C - self.eps_C):(self.test_C + self.eps_C), - (self.test_D - self.eps_D):(self.test_D + self.eps_D)], :] + def time_index_slice(self): + self.mdt.loc[self.idx, :] + + +class IntervalIndexing(object): + + def setup_cache(self): + idx = IntervalIndex.from_breaks(np.arange(1000001)) + monotonic = Series(np.arange(1000000), index=idx) + return monotonic + + def time_getitem_scalar(self, monotonic): + monotonic[80000] + + def time_loc_scalar(self, monotonic): + monotonic.loc[80000] + + def time_getitem_list(self, monotonic): + monotonic[80000:] + + def time_loc_list(self, monotonic): + monotonic.loc[80000:] + + +class CategoricalIndexIndexing(object): + + params = ['monotonic_incr', 'monotonic_decr', 'non_monotonic'] + param_names = ['index'] + + def setup(self, index): + N = 10**5 + values = list('a' * N + 'b' * N + 'c' * N) + indices = { + 'monotonic_incr': CategoricalIndex(values), + 'monotonic_decr': CategoricalIndex(reversed(values)), + 'non_monotonic': CategoricalIndex(list('abc' * N))} + self.data = indices[index] + + self.int_scalar = 10000 + self.int_list = list(range(10000)) + + self.cat_scalar = 'b' + self.cat_list = ['a', 'c'] - def time_multiindex_get_indexer(self): - self.miint.get_indexer( - np.array([(0, 10), (0, 11), (0, 12), - (0, 13), (0, 14), (0, 15), - (0, 16), (0, 17), (0, 18), - (0, 19)], dtype=object)) + def time_getitem_scalar(self, index): + self.data[self.int_scalar] - def time_multiindex_string_get_loc(self): - self.mistring.get_loc((999, 19, 'Z')) + def time_getitem_slice(self, index): + self.data[:self.int_scalar] - def time_is_monotonic(self): - self.miint.is_monotonic + def time_getitem_list_like(self, index): + self.data[[self.int_scalar]] + + def time_getitem_list(self, index): + self.data[self.int_list] + + def time_getitem_bool_array(self, index): + self.data[self.data == self.cat_scalar] + + def time_get_loc_scalar(self, index): + self.data.get_loc(self.cat_scalar) + + def time_get_indexer_list(self, index): + 
self.data.get_indexer(self.cat_list) class PanelIndexing(object): - goal_time = 0.2 def setup(self): - self.p = Panel(np.random.randn(100, 100, 100)) - self.inds = range(0, 100, 10) + with warnings.catch_warnings(record=True): + self.p = Panel(np.random.randn(100, 100, 100)) + self.inds = range(0, 100, 10) def time_subset(self): - self.p.ix[(self.inds, self.inds, self.inds)] + with warnings.catch_warnings(record=True): + self.p.ix[(self.inds, self.inds, self.inds)] + + +class MethodLookup(object): + + def setup_cache(self): + s = Series() + return s + + def time_lookup_iloc(self, s): + s.iloc + + def time_lookup_ix(self, s): + s.ix + + def time_lookup_loc(self, s): + s.loc + + +class GetItemSingleColumn(object): + + def setup(self): + self.df_string_col = DataFrame(np.random.randn(3000, 1), columns=['A']) + self.df_int_col = DataFrame(np.random.randn(3000, 1)) + + def time_frame_getitem_single_column_label(self): + self.df_string_col['A'] + + def time_frame_getitem_single_column_int(self): + self.df_int_col[0] + + +class AssignTimeseriesIndex(object): + + def setup(self): + N = 100000 + idx = date_range('1/1/2000', periods=N, freq='H') + self.df = DataFrame(np.random.randn(N, 1), columns=['A'], index=idx) + + def time_frame_assign_timeseries_index(self): + self.df['date'] = self.df.index + + +class InsertColumns(object): + + def setup(self): + self.N = 10**3 + self.df = DataFrame(index=range(self.N)) + + def time_insert(self): + np.random.seed(1234) + for i in range(100): + self.df.insert(0, i, np.random.randn(self.N), + allow_duplicates=True) + + def time_assign_with_setitem(self): + np.random.seed(1234) + for i in range(100): + self.df[i] = np.random.randn(self.N) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/indexing_engines.py b/asv_bench/benchmarks/indexing_engines.py new file mode 100644 index 0000000000000..f3d063ee31bc8 --- /dev/null +++ b/asv_bench/benchmarks/indexing_engines.py @@ -0,0 +1,64 @@ +import numpy as np + +from pandas._libs import index as libindex + + +def _get_numeric_engines(): + engine_names = [ + ('Int64Engine', np.int64), ('Int32Engine', np.int32), + ('Int16Engine', np.int16), ('Int8Engine', np.int8), + ('UInt64Engine', np.uint64), ('UInt32Engine', np.uint32), + ('UInt16engine', np.uint16), ('UInt8Engine', np.uint8), + ('Float64Engine', np.float64), ('Float32Engine', np.float32), + ] + return [(getattr(libindex, engine_name), dtype) + for engine_name, dtype in engine_names + if hasattr(libindex, engine_name)] + + +class NumericEngineIndexing(object): + + params = [_get_numeric_engines(), + ['monotonic_incr', 'monotonic_decr', 'non_monotonic'], + ] + param_names = ['engine_and_dtype', 'index_type'] + + def setup(self, engine_and_dtype, index_type): + engine, dtype = engine_and_dtype + N = 10**5 + values = list([1] * N + [2] * N + [3] * N) + arr = { + 'monotonic_incr': np.array(values, dtype=dtype), + 'monotonic_decr': np.array(list(reversed(values)), + dtype=dtype), + 'non_monotonic': np.array([1, 2, 3] * N, dtype=dtype), + }[index_type] + + self.data = engine(lambda: arr, len(arr)) + # code belows avoids populating the mapping etc. while timing. 
+ self.data.get_loc(2) + + def time_get_loc(self, engine_and_dtype, index_type): + self.data.get_loc(2) + + +class ObjectEngineIndexing(object): + + params = [('monotonic_incr', 'monotonic_decr', 'non_monotonic')] + param_names = ['index_type'] + + def setup(self, index_type): + N = 10**5 + values = list('a' * N + 'b' * N + 'c' * N) + arr = { + 'monotonic_incr': np.array(values, dtype=object), + 'monotonic_decr': np.array(list(reversed(values)), dtype=object), + 'non_monotonic': np.array(list('abc') * N, dtype=object), + }[index_type] + + self.data = libindex.ObjectEngine(lambda: arr, len(arr)) + # code belows avoids populating the mapping etc. while timing. + self.data.get_loc('b') + + def time_get_loc(self, index_type): + self.data.get_loc('b') diff --git a/asv_bench/benchmarks/inference.py b/asv_bench/benchmarks/inference.py index 3635438a7f76b..423bd02b93596 100644 --- a/asv_bench/benchmarks/inference.py +++ b/asv_bench/benchmarks/inference.py @@ -1,77 +1,76 @@ -from .pandas_vb_common import * -import pandas as pd +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, Series, to_numeric +from .pandas_vb_common import numeric_dtypes, lib -class DtypeInfer(object): - goal_time = 0.2 +class NumericInferOps(object): # from GH 7332 + params = numeric_dtypes + param_names = ['dtype'] - def setup(self): - self.N = 500000 - self.df_int64 = DataFrame(dict(A=np.arange(self.N, dtype='int64'), - B=np.arange(self.N, dtype='int64'))) - self.df_int32 = DataFrame(dict(A=np.arange(self.N, dtype='int32'), - B=np.arange(self.N, dtype='int32'))) - self.df_uint32 = DataFrame(dict(A=np.arange(self.N, dtype='uint32'), - B=np.arange(self.N, dtype='uint32'))) - self.df_float64 = DataFrame(dict(A=np.arange(self.N, dtype='float64'), - B=np.arange(self.N, dtype='float64'))) - self.df_float32 = DataFrame(dict(A=np.arange(self.N, dtype='float32'), - B=np.arange(self.N, dtype='float32'))) - self.df_datetime64 = DataFrame(dict(A=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'), - B=pd.to_datetime(np.arange(self.N, dtype='int64'), unit='ms'))) - self.df_timedelta64 = DataFrame(dict(A=(self.df_datetime64['A'] - self.df_datetime64['B']), - B=self.df_datetime64['B'])) + def setup(self, dtype): + N = 5 * 10**5 + self.df = DataFrame({'A': np.arange(N).astype(dtype), + 'B': np.arange(N).astype(dtype)}) - def time_int64(self): - (self.df_int64['A'] + self.df_int64['B']) + def time_add(self, dtype): + self.df['A'] + self.df['B'] - def time_int32(self): - (self.df_int32['A'] + self.df_int32['B']) + def time_subtract(self, dtype): + self.df['A'] - self.df['B'] - def time_uint32(self): - (self.df_uint32['A'] + self.df_uint32['B']) + def time_multiply(self, dtype): + self.df['A'] * self.df['B'] - def time_float64(self): - (self.df_float64['A'] + self.df_float64['B']) + def time_divide(self, dtype): + self.df['A'] / self.df['B'] - def time_float32(self): - (self.df_float32['A'] + self.df_float32['B']) + def time_modulo(self, dtype): + self.df['A'] % self.df['B'] - def time_datetime64(self): - (self.df_datetime64['A'] - self.df_datetime64['B']) - def time_timedelta64_1(self): - (self.df_timedelta64['A'] + self.df_timedelta64['B']) +class DateInferOps(object): + # from GH 7332 + def setup_cache(self): + N = 5 * 10**5 + df = DataFrame({'datetime64': np.arange(N).astype('datetime64[ms]')}) + df['timedelta'] = df['datetime64'] - df['datetime64'] + return df - def time_timedelta64_2(self): - (self.df_timedelta64['A'] + self.df_timedelta64['A']) + def time_subtract_datetimes(self, df): + 
df['datetime64'] - df['datetime64'] + def time_timedelta_plus_datetime(self, df): + df['timedelta'] + df['datetime64'] -class to_numeric(object): - goal_time = 0.2 + def time_add_timedeltas(self, df): + df['timedelta'] + df['timedelta'] - def setup(self): - self.n = 10000 - self.float = Series(np.random.randn(self.n * 100)) - self.numstr = self.float.astype('str') - self.str = Series(tm.makeStringIndex(self.n)) - def time_from_float(self): - pd.to_numeric(self.float) +class ToNumeric(object): + + params = ['ignore', 'coerce'] + param_names = ['errors'] + + def setup(self, errors): + N = 10000 + self.float = Series(np.random.randn(N)) + self.numstr = self.float.astype('str') + self.str = Series(tm.makeStringIndex(N)) - def time_from_numeric_str(self): - pd.to_numeric(self.numstr) + def time_from_float(self, errors): + to_numeric(self.float, errors=errors) - def time_from_str_ignore(self): - pd.to_numeric(self.str, errors='ignore') + def time_from_numeric_str(self, errors): + to_numeric(self.numstr, errors=errors) - def time_from_str_coerce(self): - pd.to_numeric(self.str, errors='coerce') + def time_from_str(self, errors): + to_numeric(self.str, errors=errors) -class to_numeric_downcast(object): +class ToNumericDowncast(object): param_names = ['dtype', 'downcast'] params = [['string-float', 'string-int', 'string-nint', 'datetime64', @@ -81,37 +80,33 @@ class to_numeric_downcast(object): N = 500000 N2 = int(N / 2) - data_dict = { - 'string-int': (['1'] * N2) + ([2] * N2), - 'string-nint': (['-1'] * N2) + ([2] * N2), - 'datetime64': np.repeat(np.array(['1970-01-01', '1970-01-02'], - dtype='datetime64[D]'), N), - 'string-float': (['1.1'] * N2) + ([2] * N2), - 'int-list': ([1] * N2) + ([2] * N2), - 'int32': np.repeat(np.int32(1), N) - } + data_dict = {'string-int': ['1'] * N2 + [2] * N2, + 'string-nint': ['-1'] * N2 + [2] * N2, + 'datetime64': np.repeat(np.array(['1970-01-01', '1970-01-02'], + dtype='datetime64[D]'), N), + 'string-float': ['1.1'] * N2 + [2] * N2, + 'int-list': [1] * N2 + [2] * N2, + 'int32': np.repeat(np.int32(1), N)} def setup(self, dtype, downcast): self.data = self.data_dict[dtype] def time_downcast(self, dtype, downcast): - pd.to_numeric(self.data, downcast=downcast) + to_numeric(self.data, downcast=downcast) class MaybeConvertNumeric(object): - def setup(self): - n = 1000000 - arr = np.repeat([2**63], n) - arr = arr + np.arange(n).astype('uint64') - arr = np.array([arr[i] if i%2 == 0 else - str(arr[i]) for i in range(n)], - dtype=object) - - arr[-1] = -1 - self.data = arr - self.na_values = set() - - def time_convert(self): - pd.lib.maybe_convert_numeric(self.data, self.na_values, - coerce_numeric=False) + def setup_cache(self): + N = 10**6 + arr = np.repeat([2**63], N) + np.arange(N).astype('uint64') + data = arr.astype(object) + data[1::2] = arr[1::2].astype(str) + data[-1] = -1 + return data + + def time_convert(self, data): + lib.maybe_convert_numeric(data, set(), coerce_numeric=False) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/doc/sphinxext/ipython_sphinxext/__init__.py b/asv_bench/benchmarks/io/__init__.py similarity index 100% rename from doc/sphinxext/ipython_sphinxext/__init__.py rename to asv_bench/benchmarks/io/__init__.py diff --git a/asv_bench/benchmarks/io/csv.py b/asv_bench/benchmarks/io/csv.py new file mode 100644 index 0000000000000..d42a15d61fb0d --- /dev/null +++ b/asv_bench/benchmarks/io/csv.py @@ -0,0 +1,236 @@ +import random +import string + +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, 
Categorical, date_range, read_csv +from pandas.compat import cStringIO as StringIO + +from ..pandas_vb_common import BaseIO + + +class ToCSV(BaseIO): + + fname = '__test__.csv' + params = ['wide', 'long', 'mixed'] + param_names = ['kind'] + + def setup(self, kind): + wide_frame = DataFrame(np.random.randn(3000, 30)) + long_frame = DataFrame({'A': np.arange(50000), + 'B': np.arange(50000) + 1., + 'C': np.arange(50000) + 2., + 'D': np.arange(50000) + 3.}) + mixed_frame = DataFrame({'float': np.random.randn(5000), + 'int': np.random.randn(5000).astype(int), + 'bool': (np.arange(5000) % 2) == 0, + 'datetime': date_range('2001', + freq='s', + periods=5000), + 'object': ['foo'] * 5000}) + mixed_frame.loc[30:500, 'float'] = np.nan + data = {'wide': wide_frame, + 'long': long_frame, + 'mixed': mixed_frame} + self.df = data[kind] + + def time_frame(self, kind): + self.df.to_csv(self.fname) + + +class ToCSVDatetime(BaseIO): + + fname = '__test__.csv' + + def setup(self): + rng = date_range('1/1/2000', periods=1000) + self.data = DataFrame(rng, index=rng) + + def time_frame_date_formatting(self): + self.data.to_csv(self.fname, date_format='%Y%m%d') + + +class StringIORewind(object): + + def data(self, stringio_object): + stringio_object.seek(0) + return stringio_object + + +class ReadCSVDInferDatetimeFormat(StringIORewind): + + params = ([True, False], ['custom', 'iso8601', 'ymd']) + param_names = ['infer_datetime_format', 'format'] + + def setup(self, infer_datetime_format, format): + rng = date_range('1/1/2000', periods=1000) + formats = {'custom': '%m/%d/%Y %H:%M:%S.%f', + 'iso8601': '%Y-%m-%d %H:%M:%S', + 'ymd': '%Y%m%d'} + dt_format = formats[format] + self.StringIO_input = StringIO('\n'.join( + rng.strftime(dt_format).tolist())) + + def time_read_csv(self, infer_datetime_format, format): + read_csv(self.data(self.StringIO_input), + header=None, names=['foo'], parse_dates=['foo'], + infer_datetime_format=infer_datetime_format) + + +class ReadCSVSkipRows(BaseIO): + + fname = '__test__.csv' + params = [None, 10000] + param_names = ['skiprows'] + + def setup(self, skiprows): + N = 20000 + index = tm.makeStringIndex(N) + df = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N), + 'string1': ['foo'] * N, + 'bool1': [True] * N, + 'int1': np.random.randint(0, N, size=N)}, + index=index) + df.to_csv(self.fname) + + def time_skipprows(self, skiprows): + read_csv(self.fname, skiprows=skiprows) + + +class ReadUint64Integers(StringIORewind): + + def setup(self): + self.na_values = [2**63 + 500] + arr = np.arange(10000).astype('uint64') + 2**63 + self.data1 = StringIO('\n'.join(arr.astype(str).tolist())) + arr = arr.astype(object) + arr[500] = -1 + self.data2 = StringIO('\n'.join(arr.astype(str).tolist())) + + def time_read_uint64(self): + read_csv(self.data(self.data1), header=None, names=['foo']) + + def time_read_uint64_neg_values(self): + read_csv(self.data(self.data2), header=None, names=['foo']) + + def time_read_uint64_na_values(self): + read_csv(self.data(self.data1), header=None, names=['foo'], + na_values=self.na_values) + + +class ReadCSVThousands(BaseIO): + + fname = '__test__.csv' + params = ([',', '|'], [None, ',']) + param_names = ['sep', 'thousands'] + + def setup(self, sep, thousands): + N = 10000 + K = 8 + data = np.random.randn(N, K) * np.random.randint(100, 10000, (N, K)) + df = DataFrame(data) + if thousands is not None: + fmt = ':{}'.format(thousands) + fmt = '{' + fmt + '}' + df = df.applymap(lambda x: fmt.format(x)) + df.to_csv(self.fname, sep=sep) + + def 
time_thousands(self, sep, thousands): + read_csv(self.fname, sep=sep, thousands=thousands) + + +class ReadCSVComment(StringIORewind): + + def setup(self): + data = ['A,B,C'] + (['1,2,3 # comment'] * 100000) + self.StringIO_input = StringIO('\n'.join(data)) + + def time_comment(self): + read_csv(self.data(self.StringIO_input), comment='#', + header=None, names=list('abc')) + + +class ReadCSVFloatPrecision(StringIORewind): + + params = ([',', ';'], ['.', '_'], [None, 'high', 'round_trip']) + param_names = ['sep', 'decimal', 'float_precision'] + + def setup(self, sep, decimal, float_precision): + floats = [''.join(random.choice(string.digits) for _ in range(28)) + for _ in range(15)] + rows = sep.join(['0{}'.format(decimal) + '{}'] * 3) + '\n' + data = rows * 5 + data = data.format(*floats) * 200 # 1000 x 3 strings csv + self.StringIO_input = StringIO(data) + + def time_read_csv(self, sep, decimal, float_precision): + read_csv(self.data(self.StringIO_input), sep=sep, header=None, + names=list('abc'), float_precision=float_precision) + + def time_read_csv_python_engine(self, sep, decimal, float_precision): + read_csv(self.data(self.StringIO_input), sep=sep, header=None, + engine='python', float_precision=None, names=list('abc')) + + +class ReadCSVCategorical(BaseIO): + + fname = '__test__.csv' + + def setup(self): + N = 100000 + group1 = ['aaaaaaaa', 'bbbbbbb', 'cccccccc', 'dddddddd', 'eeeeeeee'] + df = DataFrame(np.random.choice(group1, (N, 3)), columns=list('abc')) + df.to_csv(self.fname, index=False) + + def time_convert_post(self): + read_csv(self.fname).apply(Categorical) + + def time_convert_direct(self): + read_csv(self.fname, dtype='category') + + +class ReadCSVParseDates(StringIORewind): + + def setup(self): + data = """{},19:00:00,18:56:00,0.8100,2.8100,7.2000,0.0000,280.0000\n + {},20:00:00,19:56:00,0.0100,2.2100,7.2000,0.0000,260.0000\n + {},21:00:00,20:56:00,-0.5900,2.2100,5.7000,0.0000,280.0000\n + {},21:00:00,21:18:00,-0.9900,2.0100,3.6000,0.0000,270.0000\n + {},22:00:00,21:56:00,-0.5900,1.7100,5.1000,0.0000,290.0000\n + """ + two_cols = ['KORD,19990127'] * 5 + data = data.format(*two_cols) + self.StringIO_input = StringIO(data) + + def time_multiple_date(self): + read_csv(self.data(self.StringIO_input), sep=',', header=None, + names=list(string.digits[:9]), + parse_dates=[[1, 2], [1, 3]]) + + def time_baseline(self): + read_csv(self.data(self.StringIO_input), sep=',', header=None, + parse_dates=[1], + names=list(string.digits[:9])) + + +class ReadCSVMemoryGrowth(BaseIO): + + chunksize = 20 + num_rows = 1000 + fname = "__test__.csv" + + def setup(self): + with open(self.fname, "w") as f: + for i in range(self.num_rows): + f.write("{i}\n".format(i=i)) + + def mem_parser_chunks(self): + # see gh-24805. 
+ result = read_csv(self.fname, chunksize=self.chunksize) + + for _ in result: + pass + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/excel.py b/asv_bench/benchmarks/io/excel.py new file mode 100644 index 0000000000000..1bee864fbcf2d --- /dev/null +++ b/asv_bench/benchmarks/io/excel.py @@ -0,0 +1,36 @@ +import numpy as np +from pandas import DataFrame, date_range, ExcelWriter, read_excel +from pandas.compat import BytesIO +import pandas.util.testing as tm + + +class Excel(object): + + params = ['openpyxl', 'xlsxwriter', 'xlwt'] + param_names = ['engine'] + + def setup(self, engine): + N = 2000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.bio_read = BytesIO() + self.writer_read = ExcelWriter(self.bio_read, engine=engine) + self.df.to_excel(self.writer_read, sheet_name='Sheet1') + self.writer_read.save() + self.bio_read.seek(0) + + def time_read_excel(self, engine): + read_excel(self.bio_read) + + def time_write_excel(self, engine): + bio_write = BytesIO() + bio_write.seek(0) + writer_write = ExcelWriter(bio_write, engine=engine) + self.df.to_excel(writer_write, sheet_name='Sheet1') + writer_write.save() + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/hdf.py b/asv_bench/benchmarks/io/hdf.py new file mode 100644 index 0000000000000..a5dc28eb9508c --- /dev/null +++ b/asv_bench/benchmarks/io/hdf.py @@ -0,0 +1,122 @@ +import numpy as np +from pandas import DataFrame, date_range, HDFStore, read_hdf +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO + + +class HDFStoreDataFrame(BaseIO): + + def setup(self): + N = 25000 + index = tm.makeStringIndex(N) + self.df = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N)}, + index=index) + self.df_mixed = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N), + 'string1': ['foo'] * N, + 'bool1': [True] * N, + 'int1': np.random.randint(0, N, size=N)}, + index=index) + self.df_wide = DataFrame(np.random.randn(N, 100)) + self.start_wide = self.df_wide.index[10000] + self.stop_wide = self.df_wide.index[15000] + self.df2 = DataFrame({'float1': np.random.randn(N), + 'float2': np.random.randn(N)}, + index=date_range('1/1/2000', periods=N)) + self.start = self.df2.index[10000] + self.stop = self.df2.index[15000] + self.df_wide2 = DataFrame(np.random.randn(N, 100), + index=date_range('1/1/2000', periods=N)) + self.df_dc = DataFrame(np.random.randn(N, 10), + columns=['C%03d' % i for i in range(10)]) + + self.fname = '__test__.h5' + + self.store = HDFStore(self.fname) + self.store.put('fixed', self.df) + self.store.put('fixed_mixed', self.df_mixed) + self.store.append('table', self.df2) + self.store.append('table_mixed', self.df_mixed) + self.store.append('table_wide', self.df_wide) + self.store.append('table_wide2', self.df_wide2) + + def teardown(self): + self.store.close() + self.remove(self.fname) + + def time_read_store(self): + self.store.get('fixed') + + def time_read_store_mixed(self): + self.store.get('fixed_mixed') + + def time_write_store(self): + self.store.put('fixed_write', self.df) + + def time_write_store_mixed(self): + self.store.put('fixed_mixed_write', self.df_mixed) + + def time_read_store_table_mixed(self): + self.store.select('table_mixed') + + def time_write_store_table_mixed(self): + self.store.append('table_mixed_write', 
self.df_mixed) + + def time_read_store_table(self): + self.store.select('table') + + def time_write_store_table(self): + self.store.append('table_write', self.df) + + def time_read_store_table_wide(self): + self.store.select('table_wide') + + def time_write_store_table_wide(self): + self.store.append('table_wide_write', self.df_wide) + + def time_write_store_table_dc(self): + self.store.append('table_dc_write', self.df_dc, data_columns=True) + + def time_query_store_table_wide(self): + self.store.select('table_wide', where="index > self.start_wide and " + "index < self.stop_wide") + + def time_query_store_table(self): + self.store.select('table', where="index > self.start and " + "index < self.stop") + + def time_store_repr(self): + repr(self.store) + + def time_store_str(self): + str(self.store) + + def time_store_info(self): + self.store.info() + + +class HDF(BaseIO): + + params = ['table', 'fixed'] + param_names = ['format'] + + def setup(self, format): + self.fname = '__test__.h5' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df.to_hdf(self.fname, 'df', format=format) + + def time_read_hdf(self, format): + read_hdf(self.fname, 'df') + + def time_write_hdf(self, format): + self.df.to_hdf(self.fname, 'df', format=format) + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/json.py b/asv_bench/benchmarks/io/json.py new file mode 100644 index 0000000000000..ec2ddc11b7c1d --- /dev/null +++ b/asv_bench/benchmarks/io/json.py @@ -0,0 +1,127 @@ +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, date_range, timedelta_range, concat, read_json + +from ..pandas_vb_common import BaseIO + + +class ReadJSON(BaseIO): + + fname = "__test__.json" + params = (['split', 'index', 'records'], ['int', 'datetime']) + param_names = ['orient', 'index'] + + def setup(self, orient, index): + N = 100000 + indexes = {'int': np.arange(N), + 'datetime': date_range('20000101', periods=N, freq='H')} + df = DataFrame(np.random.randn(N, 5), + columns=['float_{}'.format(i) for i in range(5)], + index=indexes[index]) + df.to_json(self.fname, orient=orient) + + def time_read_json(self, orient, index): + read_json(self.fname, orient=orient) + + +class ReadJSONLines(BaseIO): + + fname = "__test_lines__.json" + params = ['int', 'datetime'] + param_names = ['index'] + + def setup(self, index): + N = 100000 + indexes = {'int': np.arange(N), + 'datetime': date_range('20000101', periods=N, freq='H')} + df = DataFrame(np.random.randn(N, 5), + columns=['float_{}'.format(i) for i in range(5)], + index=indexes[index]) + df.to_json(self.fname, orient='records', lines=True) + + def time_read_json_lines(self, index): + read_json(self.fname, orient='records', lines=True) + + def time_read_json_lines_concat(self, index): + concat(read_json(self.fname, orient='records', lines=True, + chunksize=25000)) + + def peakmem_read_json_lines(self, index): + read_json(self.fname, orient='records', lines=True) + + def peakmem_read_json_lines_concat(self, index): + concat(read_json(self.fname, orient='records', lines=True, + chunksize=25000)) + + +class ToJSON(BaseIO): + + fname = "__test__.json" + params = ['split', 'columns', 'index'] + param_names = ['orient'] + + def setup(self, lines_orient): + N = 10**5 + ncols = 5 + index = date_range('20000101', periods=N, freq='H') + timedeltas = 
timedelta_range(start=1, periods=N, freq='s') + datetimes = date_range(start=1, periods=N, freq='s') + ints = np.random.randint(100000000, size=N) + floats = np.random.randn(N) + strings = tm.makeStringIndex(N) + self.df = DataFrame(np.random.randn(N, ncols), index=np.arange(N)) + self.df_date_idx = DataFrame(np.random.randn(N, ncols), index=index) + self.df_td_int_ts = DataFrame({'td_1': timedeltas, + 'td_2': timedeltas, + 'int_1': ints, + 'int_2': ints, + 'ts_1': datetimes, + 'ts_2': datetimes}, + index=index) + self.df_int_floats = DataFrame({'int_1': ints, + 'int_2': ints, + 'int_3': ints, + 'float_1': floats, + 'float_2': floats, + 'float_3': floats}, + index=index) + self.df_int_float_str = DataFrame({'int_1': ints, + 'int_2': ints, + 'float_1': floats, + 'float_2': floats, + 'str_1': strings, + 'str_2': strings}, + index=index) + + def time_floats_with_int_index(self, orient): + self.df.to_json(self.fname, orient=orient) + + def time_floats_with_dt_index(self, orient): + self.df_date_idx.to_json(self.fname, orient=orient) + + def time_delta_int_tstamp(self, orient): + self.df_td_int_ts.to_json(self.fname, orient=orient) + + def time_float_int(self, orient): + self.df_int_floats.to_json(self.fname, orient=orient) + + def time_float_int_str(self, orient): + self.df_int_float_str.to_json(self.fname, orient=orient) + + def time_floats_with_int_idex_lines(self, orient): + self.df.to_json(self.fname, orient='records', lines=True) + + def time_floats_with_dt_index_lines(self, orient): + self.df_date_idx.to_json(self.fname, orient='records', lines=True) + + def time_delta_int_tstamp_lines(self, orient): + self.df_td_int_ts.to_json(self.fname, orient='records', lines=True) + + def time_float_int_lines(self, orient): + self.df_int_floats.to_json(self.fname, orient='records', lines=True) + + def time_float_int_str_lines(self, orient): + self.df_int_float_str.to_json(self.fname, orient='records', lines=True) + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/msgpack.py b/asv_bench/benchmarks/io/msgpack.py new file mode 100644 index 0000000000000..dc2642d920fd0 --- /dev/null +++ b/asv_bench/benchmarks/io/msgpack.py @@ -0,0 +1,27 @@ +import numpy as np +from pandas import DataFrame, date_range, read_msgpack +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO + + +class MSGPack(BaseIO): + + def setup(self): + self.fname = '__test__.msg' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df.to_msgpack(self.fname) + + def time_read_msgpack(self): + read_msgpack(self.fname) + + def time_write_msgpack(self): + self.df.to_msgpack(self.fname) + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/pickle.py b/asv_bench/benchmarks/io/pickle.py new file mode 100644 index 0000000000000..74a58bbb946aa --- /dev/null +++ b/asv_bench/benchmarks/io/pickle.py @@ -0,0 +1,27 @@ +import numpy as np +from pandas import DataFrame, date_range, read_pickle +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO + + +class Pickle(BaseIO): + + def setup(self): + self.fname = '__test__.pkl' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df.to_pickle(self.fname) + + 
def time_read_pickle(self): + read_pickle(self.fname) + + def time_write_pickle(self): + self.df.to_pickle(self.fname) + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/sas.py b/asv_bench/benchmarks/io/sas.py new file mode 100644 index 0000000000000..2783f42cad895 --- /dev/null +++ b/asv_bench/benchmarks/io/sas.py @@ -0,0 +1,20 @@ +import os + +from pandas import read_sas + + +class SAS(object): + + params = ['sas7bdat', 'xport'] + param_names = ['format'] + + def setup(self, format): + # Read files that are located in 'pandas/io/tests/sas/data' + files = {'sas7bdat': 'test1.sas7bdat', 'xport': 'paxraw_d_short.xpt'} + file = files[format] + paths = [os.path.dirname(__file__), '..', '..', '..', 'pandas', + 'tests', 'io', 'sas', 'data', file] + self.f = os.path.join(*paths) + + def time_read_msgpack(self, format): + read_sas(self.f, format=format) diff --git a/asv_bench/benchmarks/io/sql.py b/asv_bench/benchmarks/io/sql.py new file mode 100644 index 0000000000000..075d3bdda5ed9 --- /dev/null +++ b/asv_bench/benchmarks/io/sql.py @@ -0,0 +1,127 @@ +import sqlite3 + +import numpy as np +import pandas.util.testing as tm +from pandas import DataFrame, date_range, read_sql_query, read_sql_table +from sqlalchemy import create_engine + + +class SQL(object): + + params = ['sqlalchemy', 'sqlite'] + param_names = ['connection'] + + def setup(self, connection): + N = 10000 + con = {'sqlalchemy': create_engine('sqlite:///:memory:'), + 'sqlite': sqlite3.connect(':memory:')} + self.table_name = 'test_type' + self.query_all = 'SELECT * FROM {}'.format(self.table_name) + self.con = con[connection] + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_to_sql_dataframe(self, connection): + self.df.to_sql('test1', self.con, if_exists='replace') + + def time_read_sql_query(self, connection): + read_sql_query(self.query_all, self.con) + + +class WriteSQLDtypes(object): + + params = (['sqlalchemy', 'sqlite'], + ['float', 'float_with_nan', 'string', 'bool', 'int', 'datetime']) + param_names = ['connection', 'dtype'] + + def setup(self, connection, dtype): + N = 10000 + con = {'sqlalchemy': create_engine('sqlite:///:memory:'), + 'sqlite': sqlite3.connect(':memory:')} + self.table_name = 'test_type' + self.query_col = 'SELECT {} FROM {}'.format(dtype, self.table_name) + self.con = con[connection] + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_to_sql_dataframe_column(self, connection, dtype): + self.df[[dtype]].to_sql('test1', self.con, if_exists='replace') + + def time_read_sql_query_select_column(self, connection, dtype): + read_sql_query(self.query_col, self.con) + + +class ReadSQLTable(object): + + def setup(self): + N = 10000 + self.table_name = 
'test' + self.con = create_engine('sqlite:///:memory:') + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_read_sql_table_all(self): + read_sql_table(self.table_name, self.con) + + def time_read_sql_table_parse_dates(self): + read_sql_table(self.table_name, self.con, columns=['datetime_string'], + parse_dates=['datetime_string']) + + +class ReadSQLTableDtypes(object): + + params = ['float', 'float_with_nan', 'string', 'bool', 'int', 'datetime'] + param_names = ['dtype'] + + def setup(self, dtype): + N = 10000 + self.table_name = 'test' + self.con = create_engine('sqlite:///:memory:') + self.df = DataFrame({'float': np.random.randn(N), + 'float_with_nan': np.random.randn(N), + 'string': ['foo'] * N, + 'bool': [True] * N, + 'int': np.random.randint(0, N, size=N), + 'datetime': date_range('2000-01-01', + periods=N, + freq='s')}, + index=tm.makeStringIndex(N)) + self.df.loc[1000:3000, 'float_with_nan'] = np.nan + self.df['datetime_string'] = self.df['datetime'].astype(str) + self.df.to_sql(self.table_name, self.con, if_exists='replace') + + def time_read_sql_table_column(self, dtype): + read_sql_table(self.table_name, self.con, columns=[dtype]) + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io/stata.py b/asv_bench/benchmarks/io/stata.py new file mode 100644 index 0000000000000..a7f854a853f50 --- /dev/null +++ b/asv_bench/benchmarks/io/stata.py @@ -0,0 +1,39 @@ +import numpy as np +from pandas import DataFrame, date_range, read_stata +import pandas.util.testing as tm + +from ..pandas_vb_common import BaseIO + + +class Stata(BaseIO): + + params = ['tc', 'td', 'tm', 'tw', 'th', 'tq', 'ty'] + param_names = ['convert_dates'] + + def setup(self, convert_dates): + self.fname = '__test__.dta' + N = 100000 + C = 5 + self.df = DataFrame(np.random.randn(N, C), + columns=['float{}'.format(i) for i in range(C)], + index=date_range('20000101', periods=N, freq='H')) + self.df['object'] = tm.makeStringIndex(N) + self.df['int8_'] = np.random.randint(np.iinfo(np.int8).min, + np.iinfo(np.int8).max - 27, N) + self.df['int16_'] = np.random.randint(np.iinfo(np.int16).min, + np.iinfo(np.int16).max - 27, N) + self.df['int32_'] = np.random.randint(np.iinfo(np.int32).min, + np.iinfo(np.int32).max - 27, N) + self.df['float32_'] = np.array(np.random.randn(N), + dtype=np.float32) + self.convert_dates = {'index': convert_dates} + self.df.to_stata(self.fname, self.convert_dates) + + def time_read_stata(self, convert_dates): + read_stata(self.fname) + + def time_write_stata(self, convert_dates): + self.df.to_stata(self.fname, self.convert_dates) + + +from ..pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/io_bench.py b/asv_bench/benchmarks/io_bench.py deleted file mode 100644 index 52064d2cdb8a2..0000000000000 --- a/asv_bench/benchmarks/io_bench.py +++ /dev/null @@ -1,194 +0,0 @@ -from .pandas_vb_common import * -from pandas import concat, Timestamp, compat -try: - from StringIO import StringIO -except ImportError: - from io import StringIO -import timeit - - -class frame_to_csv(object): - goal_time = 0.2 - - def setup(self): - self.df = 
DataFrame(np.random.randn(3000, 30)) - - def time_frame_to_csv(self): - self.df.to_csv('__test__.csv') - - -class frame_to_csv2(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame({'A': range(50000), }) - self.df['B'] = (self.df.A + 1.0) - self.df['C'] = (self.df.A + 2.0) - self.df['D'] = (self.df.A + 3.0) - - def time_frame_to_csv2(self): - self.df.to_csv('__test__.csv') - - -class frame_to_csv_date_formatting(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = DataFrame(self.rng, index=self.rng) - - def time_frame_to_csv_date_formatting(self): - self.data.to_csv('__test__.csv', date_format='%Y%m%d') - - -class frame_to_csv_mixed(object): - goal_time = 0.2 - - def setup(self): - self.df_float = DataFrame(np.random.randn(5000, 5), dtype='float64', columns=self.create_cols('float')) - self.df_int = DataFrame(np.random.randn(5000, 5), dtype='int64', columns=self.create_cols('int')) - self.df_bool = DataFrame(True, index=self.df_float.index, columns=self.create_cols('bool')) - self.df_object = DataFrame('foo', index=self.df_float.index, columns=self.create_cols('object')) - self.df_dt = DataFrame(Timestamp('20010101'), index=self.df_float.index, columns=self.create_cols('date')) - self.df_float.ix[30:500, 1:3] = np.nan - self.df = concat([self.df_float, self.df_int, self.df_bool, self.df_object, self.df_dt], axis=1) - - def time_frame_to_csv_mixed(self): - self.df.to_csv('__test__.csv') - - def create_cols(self, name): - return [('%s%03d' % (name, i)) for i in range(5)] - - -class read_csv_infer_datetime_format_custom(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%m/%d/%Y %H:%M:%S.%f')))) - - def time_read_csv_infer_datetime_format_custom(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo'], infer_datetime_format=True) - - -class read_csv_infer_datetime_format_iso8601(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%Y-%m-%d %H:%M:%S')))) - - def time_read_csv_infer_datetime_format_iso8601(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo'], infer_datetime_format=True) - - -class read_csv_infer_datetime_format_ymd(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%Y%m%d')))) - - def time_read_csv_infer_datetime_format_ymd(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo'], infer_datetime_format=True) - - -class read_csv_skiprows(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(20000) - self.df = DataFrame({'float1': randn(20000), 'float2': randn(20000), 'string1': (['foo'] * 20000), 'bool1': ([True] * 20000), 'int1': np.random.randint(0, 200000, size=20000), }, index=self.index) - self.df.to_csv('__test__.csv') - - def time_read_csv_skiprows(self): - read_csv('__test__.csv', skiprows=10000) - - -class read_csv_standard(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - self.df.to_csv('__test__.csv') - - def 
time_read_csv_standard(self): - read_csv('__test__.csv') - - -class read_parse_dates_iso8601(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=1000) - self.data = '\n'.join(self.rng.map((lambda x: x.strftime('%Y-%m-%d %H:%M:%S')))) - - def time_read_parse_dates_iso8601(self): - read_csv(StringIO(self.data), header=None, names=['foo'], parse_dates=['foo']) - - -class read_uint64_integers(object): - goal_time = 0.2 - - def setup(self): - self.na_values = [2**63 + 500] - - self.arr1 = np.arange(10000).astype('uint64') + 2**63 - self.data1 = '\n'.join(map(lambda x: str(x), self.arr1)) - - self.arr2 = self.arr1.copy().astype(object) - self.arr2[500] = -1 - self.data2 = '\n'.join(map(lambda x: str(x), self.arr2)) - - def time_read_uint64(self): - read_csv(StringIO(self.data1), header=None) - - def time_read_uint64_neg_values(self): - read_csv(StringIO(self.data2), header=None) - - def time_read_uint64_na_values(self): - read_csv(StringIO(self.data1), header=None, na_values=self.na_values) - - -class write_csv_standard(object): - goal_time = 0.2 - - def setup(self): - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - - def time_write_csv_standard(self): - self.df.to_csv('__test__.csv') - - -class read_csv_from_s3(object): - # Make sure that we can read part of a file from S3 without - # needing to download the entire thing. Use the timeit.default_timer - # to measure wall time instead of CPU time -- we want to see - # how long it takes to download the data. - timer = timeit.default_timer - params = ([None, "gzip", "bz2"], ["python", "c"]) - param_names = ["compression", "engine"] - - def setup(self, compression, engine): - if compression == "bz2" and engine == "c" and compat.PY2: - # The Python 2 C parser can't read bz2 from open files. - raise NotImplementedError - try: - import s3fs - except ImportError: - # Skip these benchmarks if `boto` is not installed. - raise NotImplementedError - - self.big_fname = "s3://pandas-test/large_random.csv" - - def time_read_nrows(self, compression, engine): - # Read a small number of rows from a huge (100,000 x 50) table. 
- ext = "" - if compression == "gzip": - ext = ".gz" - elif compression == "bz2": - ext = ".bz2" - pd.read_csv(self.big_fname + ext, nrows=10, - compression=compression, engine=engine) diff --git a/asv_bench/benchmarks/io_sql.py b/asv_bench/benchmarks/io_sql.py deleted file mode 100644 index ec855e5d33525..0000000000000 --- a/asv_bench/benchmarks/io_sql.py +++ /dev/null @@ -1,105 +0,0 @@ -import sqlalchemy -from .pandas_vb_common import * -import sqlite3 -from sqlalchemy import create_engine - - -#------------------------------------------------------------------------------- -# to_sql - -class WriteSQL(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - - def time_fallback(self): - self.df.to_sql('test1', self.con, if_exists='replace') - - def time_sqlalchemy(self): - self.df.to_sql('test1', self.engine, if_exists='replace') - - -#------------------------------------------------------------------------------- -# read_sql - -class ReadSQL(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.index = tm.makeStringIndex(10000) - self.df = DataFrame({'float1': randn(10000), 'float2': randn(10000), 'string1': (['foo'] * 10000), 'bool1': ([True] * 10000), 'int1': np.random.randint(0, 100000, size=10000), }, index=self.index) - self.df.to_sql('test2', self.engine, if_exists='replace') - self.df.to_sql('test2', self.con, if_exists='replace') - - def time_read_query_fallback(self): - read_sql_query('SELECT * FROM test2', self.con) - - def time_read_query_sqlalchemy(self): - read_sql_query('SELECT * FROM test2', self.engine) - - def time_read_table_sqlalchemy(self): - read_sql_table('test2', self.engine) - - -#------------------------------------------------------------------------------- -# type specific write - -class WriteSQLTypes(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'string': (['foo'] * 10000), 'bool': ([True] * 10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df.loc[1000:3000, 'float'] = np.nan - - def time_string_fallback(self): - self.df[['string']].to_sql('test_string', self.con, if_exists='replace') - - def time_string_sqlalchemy(self): - self.df[['string']].to_sql('test_string', self.engine, if_exists='replace') - - def time_float_fallback(self): - self.df[['float']].to_sql('test_float', self.con, if_exists='replace') - - def time_float_sqlalchemy(self): - self.df[['float']].to_sql('test_float', self.engine, if_exists='replace') - - def time_datetime_sqlalchemy(self): - self.df[['datetime']].to_sql('test_datetime', self.engine, if_exists='replace') - - -#------------------------------------------------------------------------------- -# type specific read - -class ReadSQLTypes(object): - goal_time = 0.2 - - def setup(self): - self.engine = create_engine('sqlite:///:memory:') - self.con = sqlite3.connect(':memory:') - self.df = DataFrame({'float': randn(10000), 'datetime': date_range('2000-01-01', periods=10000, freq='s'), }) - self.df['datetime_string'] = self.df['datetime'].map(str) - 
self.df.to_sql('test_type', self.engine, if_exists='replace') - self.df[['float', 'datetime_string']].to_sql('test_type', self.con, if_exists='replace') - - def time_datetime_read_and_parse_sqlalchemy(self): - read_sql_table('test_type', self.engine, columns=['datetime_string'], parse_dates=['datetime_string']) - - def time_datetime_read_as_native_sqlalchemy(self): - read_sql_table('test_type', self.engine, columns=['datetime']) - - def time_float_read_query_fallback(self): - read_sql_query('SELECT float FROM test_type', self.con) - - def time_float_read_query_sqlalchemy(self): - read_sql_query('SELECT float FROM test_type', self.engine) - - def time_float_read_table_sqlalchemy(self): - read_sql_table('test_type', self.engine, columns=['float']) diff --git a/asv_bench/benchmarks/join_merge.py b/asv_bench/benchmarks/join_merge.py index 776316343e009..6da8287a06d80 100644 --- a/asv_bench/benchmarks/join_merge.py +++ b/asv_bench/benchmarks/join_merge.py @@ -1,4 +1,10 @@ -from .pandas_vb_common import * +import warnings +import string + +import numpy as np +import pandas.util.testing as tm +from pandas import (DataFrame, Series, Panel, MultiIndex, + date_range, concat, merge, merge_asof) try: from pandas import merge_ordered @@ -6,25 +12,18 @@ from pandas import ordered_merge as merge_ordered -# ---------------------------------------------------------------------- -# Append - class Append(object): - goal_time = 0.2 def setup(self): - self.df1 = pd.DataFrame(np.random.randn(10000, 4), - columns=['A', 'B', 'C', 'D']) + self.df1 = DataFrame(np.random.randn(10000, 4), + columns=['A', 'B', 'C', 'D']) self.df2 = self.df1.copy() self.df2.index = np.arange(10000, 20000) self.mdf1 = self.df1.copy() self.mdf1['obj1'] = 'bar' self.mdf1['obj2'] = 'bar' self.mdf1['int1'] = 5 - try: - self.mdf1.consolidate(inplace=True) - except: - pass + self.mdf1 = self.mdf1._consolidate() self.mdf2 = self.mdf1.copy() self.mdf2.index = self.df2.index @@ -35,237 +34,220 @@ def time_append_mixed(self): self.mdf1.append(self.mdf2) -# ---------------------------------------------------------------------- -# Concat - class Concat(object): - goal_time = 0.2 - def setup(self): - self.n = 1000 - self.indices = tm.makeStringIndex(1000) - self.s = Series(self.n, index=self.indices) - self.pieces = [self.s[i:(- i)] for i in range(1, 10)] - self.pieces = (self.pieces * 50) + params = [0, 1] + param_names = ['axis'] - self.df_small = pd.DataFrame(randn(5, 4)) + def setup(self, axis): + N = 1000 + s = Series(N, index=tm.makeStringIndex(N)) + self.series = [s[i:- i] for i in range(1, 10)] * 50 + self.small_frames = [DataFrame(np.random.randn(5, 4))] * 1000 + df = DataFrame({'A': range(N)}, + index=date_range('20130101', periods=N, freq='s')) + self.empty_left = [DataFrame(), df] + self.empty_right = [df, DataFrame()] + self.mixed_ndims = [df, df.head(N // 2)] - # empty - self.df = pd.DataFrame(dict(A=range(10000)), index=date_range('20130101', periods=10000, freq='s')) - self.empty = pd.DataFrame() + def time_concat_series(self, axis): + concat(self.series, axis=axis, sort=False) - def time_concat_series_axis1(self): - concat(self.pieces, axis=1) + def time_concat_small_frames(self, axis): + concat(self.small_frames, axis=axis) - def time_concat_small_frames(self): - concat(([self.df_small] * 1000)) + def time_concat_empty_right(self, axis): + concat(self.empty_right, axis=axis) - def time_concat_empty_frames1(self): - concat([self.df, self.empty]) + def time_concat_empty_left(self, axis): + concat(self.empty_left, axis=axis) - def 
time_concat_empty_frames2(self): - concat([self.empty, self.df]) + def time_concat_mixed_ndims(self, axis): + concat(self.mixed_ndims, axis=axis) class ConcatPanels(object): - goal_time = 0.2 - def setup(self): - dataset = np.zeros((10000, 200, 2), dtype=np.float32) - self.panels_f = [pd.Panel(np.copy(dataset, order='F')) - for i in range(20)] - self.panels_c = [pd.Panel(np.copy(dataset, order='C')) - for i in range(20)] + params = ([0, 1, 2], [True, False]) + param_names = ['axis', 'ignore_index'] - def time_c_ordered_axis0(self): - concat(self.panels_c, axis=0, ignore_index=True) + def setup(self, axis, ignore_index): + with warnings.catch_warnings(record=True): + panel_c = Panel(np.zeros((10000, 200, 2), + dtype=np.float32, + order='C')) + self.panels_c = [panel_c] * 20 + panel_f = Panel(np.zeros((10000, 200, 2), + dtype=np.float32, + order='F')) + self.panels_f = [panel_f] * 20 - def time_f_ordered_axis0(self): - concat(self.panels_f, axis=0, ignore_index=True) + def time_c_ordered(self, axis, ignore_index): + with warnings.catch_warnings(record=True): + concat(self.panels_c, axis=axis, ignore_index=ignore_index) - def time_c_ordered_axis1(self): - concat(self.panels_c, axis=1, ignore_index=True) + def time_f_ordered(self, axis, ignore_index): + with warnings.catch_warnings(record=True): + concat(self.panels_f, axis=axis, ignore_index=ignore_index) - def time_f_ordered_axis1(self): - concat(self.panels_f, axis=1, ignore_index=True) - def time_c_ordered_axis2(self): - concat(self.panels_c, axis=2, ignore_index=True) +class ConcatDataFrames(object): - def time_f_ordered_axis2(self): - concat(self.panels_f, axis=2, ignore_index=True) + params = ([0, 1], [True, False]) + param_names = ['axis', 'ignore_index'] + def setup(self, axis, ignore_index): + frame_c = DataFrame(np.zeros((10000, 200), + dtype=np.float32, order='C')) + self.frame_c = [frame_c] * 20 + frame_f = DataFrame(np.zeros((10000, 200), + dtype=np.float32, order='F')) + self.frame_f = [frame_f] * 20 -class ConcatFrames(object): - goal_time = 0.2 + def time_c_ordered(self, axis, ignore_index): + concat(self.frame_c, axis=axis, ignore_index=ignore_index) - def setup(self): - dataset = np.zeros((10000, 200), dtype=np.float32) + def time_f_ordered(self, axis, ignore_index): + concat(self.frame_f, axis=axis, ignore_index=ignore_index) - self.frames_f = [pd.DataFrame(np.copy(dataset, order='F')) - for i in range(20)] - self.frames_c = [pd.DataFrame(np.copy(dataset, order='C')) - for i in range(20)] - def time_c_ordered_axis0(self): - concat(self.frames_c, axis=0, ignore_index=True) +class Join(object): - def time_f_ordered_axis0(self): - concat(self.frames_f, axis=0, ignore_index=True) + params = [True, False] + param_names = ['sort'] - def time_c_ordered_axis1(self): - concat(self.frames_c, axis=1, ignore_index=True) + def setup(self, sort): + level1 = tm.makeStringIndex(10).values + level2 = tm.makeStringIndex(1000).values + codes1 = np.arange(10).repeat(1000) + codes2 = np.tile(np.arange(1000), 10) + index2 = MultiIndex(levels=[level1, level2], + codes=[codes1, codes2]) + self.df_multi = DataFrame(np.random.randn(len(index2), 4), + index=index2, + columns=['A', 'B', 'C', 'D']) - def time_f_ordered_axis1(self): - concat(self.frames_f, axis=1, ignore_index=True) + self.key1 = np.tile(level1.take(codes1), 10) + self.key2 = np.tile(level2.take(codes2), 10) + self.df = DataFrame({'data1': np.random.randn(100000), + 'data2': np.random.randn(100000), + 'key1': self.key1, + 'key2': self.key2}) + self.df_key1 = 
DataFrame(np.random.randn(len(level1), 4), + index=level1, + columns=['A', 'B', 'C', 'D']) + self.df_key2 = DataFrame(np.random.randn(len(level2), 4), + index=level2, + columns=['A', 'B', 'C', 'D']) -# ---------------------------------------------------------------------- -# Joins + shuf = np.arange(100000) + np.random.shuffle(shuf) + self.df_shuf = self.df.reindex(self.df.index[shuf]) -class Join(object): - goal_time = 0.2 + def time_join_dataframe_index_multi(self, sort): + self.df.join(self.df_multi, on=['key1', 'key2'], sort=sort) - def setup(self): - self.level1 = tm.makeStringIndex(10).values - self.level2 = tm.makeStringIndex(1000).values - self.label1 = np.arange(10).repeat(1000) - self.label2 = np.tile(np.arange(1000), 10) - self.key1 = np.tile(self.level1.take(self.label1), 10) - self.key2 = np.tile(self.level2.take(self.label2), 10) - self.shuf = np.arange(100000) - random.shuffle(self.shuf) - try: - self.index2 = MultiIndex(levels=[self.level1, self.level2], - labels=[self.label1, self.label2]) - self.index3 = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], - labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - self.df_multi = DataFrame(np.random.randn(len(self.index2), 4), - index=self.index2, - columns=['A', 'B', 'C', 'D']) - except: - pass - self.df = pd.DataFrame({'data1': np.random.randn(100000), - 'data2': np.random.randn(100000), - 'key1': self.key1, - 'key2': self.key2}) - self.df_key1 = pd.DataFrame(np.random.randn(len(self.level1), 4), - index=self.level1, - columns=['A', 'B', 'C', 'D']) - self.df_key2 = pd.DataFrame(np.random.randn(len(self.level2), 4), - index=self.level2, - columns=['A', 'B', 'C', 'D']) - self.df_shuf = self.df.reindex(self.df.index[self.shuf]) - - def time_join_dataframe_index_multi(self): - self.df.join(self.df_multi, on=['key1', 'key2']) - - def time_join_dataframe_index_single_key_bigger(self): - self.df.join(self.df_key2, on='key2') - - def time_join_dataframe_index_single_key_bigger_sort(self): - self.df_shuf.join(self.df_key2, on='key2', sort=True) - - def time_join_dataframe_index_single_key_small(self): - self.df.join(self.df_key1, on='key1') + def time_join_dataframe_index_single_key_bigger(self, sort): + self.df.join(self.df_key2, on='key2', sort=sort) + + def time_join_dataframe_index_single_key_small(self, sort): + self.df.join(self.df_key1, on='key1', sort=sort) + + def time_join_dataframe_index_shuffle_key_bigger_sort(self, sort): + self.df_shuf.join(self.df_key2, on='key2', sort=sort) class JoinIndex(object): - goal_time = 0.2 def setup(self): - np.random.seed(2718281) - self.n = 50000 - self.left = pd.DataFrame(np.random.randint(1, (self.n / 500), (self.n, 2)), columns=['jim', 'joe']) - self.right = pd.DataFrame(np.random.randint(1, (self.n / 500), (self.n, 2)), columns=['jolie', 'jolia']).set_index('jolie') + N = 50000 + self.left = DataFrame(np.random.randint(1, N / 500, (N, 2)), + columns=['jim', 'joe']) + self.right = DataFrame(np.random.randint(1, N / 500, (N, 2)), + columns=['jolie', 'jolia']).set_index('jolie') def time_left_outer_join_index(self): self.left.join(self.right, on='jim') -class join_non_unique_equal(object): +class JoinNonUnique(object): # outer join of non-unique # GH 6329 - - goal_time = 0.2 - def setup(self): - self.date_index = date_range('01-Jan-2013', '23-Jan-2013', freq='T') - self.daily_dates = self.date_index.to_period('D').to_timestamp('S', 'S') - self.fracofday = (self.date_index.view(np.ndarray) - 
self.daily_dates.view(np.ndarray)) - self.fracofday = (self.fracofday.astype('timedelta64[ns]').astype(np.float64) / 86400000000000.0) - self.fracofday = Series(self.fracofday, self.daily_dates) - self.index = date_range(self.date_index.min().to_period('A').to_timestamp('D', 'S'), self.date_index.max().to_period('A').to_timestamp('D', 'E'), freq='D') - self.temp = Series(1.0, self.index) + date_index = date_range('01-Jan-2013', '23-Jan-2013', freq='T') + daily_dates = date_index.to_period('D').to_timestamp('S', 'S') + self.fracofday = date_index.values - daily_dates.values + self.fracofday = self.fracofday.astype('timedelta64[ns]') + self.fracofday = self.fracofday.astype(np.float64) / 86400000000000.0 + self.fracofday = Series(self.fracofday, daily_dates) + index = date_range(date_index.min(), date_index.max(), freq='D') + self.temp = Series(1.0, index)[self.fracofday.index] def time_join_non_unique_equal(self): - (self.fracofday * self.temp[self.fracofday.index]) + self.fracofday * self.temp -# ---------------------------------------------------------------------- -# Merges - class Merge(object): - goal_time = 0.2 - def setup(self): - self.N = 10000 - self.indices = tm.makeStringIndex(self.N).values - self.indices2 = tm.makeStringIndex(self.N).values - self.key = np.tile(self.indices[:8000], 10) - self.key2 = np.tile(self.indices2[:8000], 10) - self.left = pd.DataFrame({'key': self.key, 'key2': self.key2, - 'value': np.random.randn(80000)}) - self.right = pd.DataFrame({'key': self.indices[2000:], - 'key2': self.indices2[2000:], - 'value2': np.random.randn(8000)}) - - self.df = pd.DataFrame({'key1': np.tile(np.arange(500).repeat(10), 2), - 'key2': np.tile(np.arange(250).repeat(10), 4), - 'value': np.random.randn(10000)}) - self.df2 = pd.DataFrame({'key1': np.arange(500), 'value2': randn(500)}) + params = [True, False] + param_names = ['sort'] + + def setup(self, sort): + N = 10000 + indices = tm.makeStringIndex(N).values + indices2 = tm.makeStringIndex(N).values + key = np.tile(indices[:8000], 10) + key2 = np.tile(indices2[:8000], 10) + self.left = DataFrame({'key': key, 'key2': key2, + 'value': np.random.randn(80000)}) + self.right = DataFrame({'key': indices[2000:], + 'key2': indices2[2000:], + 'value2': np.random.randn(8000)}) + + self.df = DataFrame({'key1': np.tile(np.arange(500).repeat(10), 2), + 'key2': np.tile(np.arange(250).repeat(10), 4), + 'value': np.random.randn(10000)}) + self.df2 = DataFrame({'key1': np.arange(500), + 'value2': np.random.randn(500)}) self.df3 = self.df[:5000] - def time_merge_2intkey_nosort(self): - merge(self.left, self.right, sort=False) + def time_merge_2intkey(self, sort): + merge(self.left, self.right, sort=sort) - def time_merge_2intkey_sort(self): - merge(self.left, self.right, sort=True) + def time_merge_dataframe_integer_2key(self, sort): + merge(self.df, self.df3, sort=sort) - def time_merge_dataframe_integer_2key(self): - merge(self.df, self.df3) + def time_merge_dataframe_integer_key(self, sort): + merge(self.df, self.df2, on='key1', sort=sort) - def time_merge_dataframe_integer_key(self): - merge(self.df, self.df2, on='key1') +class I8Merge(object): -class i8merge(object): - goal_time = 0.2 + params = ['inner', 'outer', 'left', 'right'] + param_names = ['how'] - def setup(self): - (low, high, n) = (((-1) << 10), (1 << 10), (1 << 20)) - self.left = pd.DataFrame(np.random.randint(low, high, (n, 7)), - columns=list('ABCDEFG')) + def setup(self, how): + low, high, n = -1000, 1000, 10**6 + self.left = DataFrame(np.random.randint(low, high, (n, 7)), 
+ columns=list('ABCDEFG')) self.left['left'] = self.left.sum(axis=1) - self.i = np.random.permutation(len(self.left)) - self.right = self.left.iloc[self.i].copy() - self.right.columns = (self.right.columns[:(-1)].tolist() + ['right']) - self.right.index = np.arange(len(self.right)) - self.right['right'] *= (-1) + self.right = self.left.sample(frac=1).rename({'left': 'right'}, axis=1) + self.right = self.right.reset_index(drop=True) + self.right['right'] *= -1 - def time_i8merge(self): - merge(self.left, self.right, how='outer') + def time_i8merge(self, how): + merge(self.left, self.right, how=how) class MergeCategoricals(object): - goal_time = 0.2 def setup(self): - self.left_object = pd.DataFrame( + self.left_object = DataFrame( {'X': np.random.choice(range(0, 10), size=(10000,)), 'Y': np.random.choice(['one', 'two', 'three'], size=(10000,))}) - self.right_object = pd.DataFrame( + self.right_object = DataFrame( {'X': np.random.choice(range(0, 10), size=(10000,)), 'Z': np.random.choice(['jjj', 'kkk', 'sss'], size=(10000,))}) @@ -281,103 +263,91 @@ def time_merge_cat(self): merge(self.left_cat, self.right_cat, on='X') -# ---------------------------------------------------------------------- -# Ordered merge - class MergeOrdered(object): def setup(self): - groups = tm.makeStringIndex(10).values - - self.left = pd.DataFrame({'group': groups.repeat(5000), - 'key' : np.tile(np.arange(0, 10000, 2), 10), - 'lvalue': np.random.randn(50000)}) - - self.right = pd.DataFrame({'key' : np.arange(10000), - 'rvalue' : np.random.randn(10000)}) + self.left = DataFrame({'group': groups.repeat(5000), + 'key': np.tile(np.arange(0, 10000, 2), 10), + 'lvalue': np.random.randn(50000)}) + self.right = DataFrame({'key': np.arange(10000), + 'rvalue': np.random.randn(10000)}) def time_merge_ordered(self): merge_ordered(self.left, self.right, on='key', left_by='group') -# ---------------------------------------------------------------------- -# asof merge - class MergeAsof(object): + params = [['backward', 'forward', 'nearest']] + param_names = ['direction'] - def setup(self): - import string - np.random.seed(0) + def setup(self, direction): one_count = 200000 two_count = 1000000 - self.df1 = pd.DataFrame( + df1 = DataFrame( {'time': np.random.randint(0, one_count / 20, one_count), - 'key': np.random.choice(list(string.uppercase), one_count), + 'key': np.random.choice(list(string.ascii_uppercase), one_count), 'key2': np.random.randint(0, 25, one_count), 'value1': np.random.randn(one_count)}) - self.df2 = pd.DataFrame( + df2 = DataFrame( {'time': np.random.randint(0, two_count / 20, two_count), - 'key': np.random.choice(list(string.uppercase), two_count), + 'key': np.random.choice(list(string.ascii_uppercase), two_count), 'key2': np.random.randint(0, 25, two_count), 'value2': np.random.randn(two_count)}) - self.df1 = self.df1.sort_values('time') - self.df2 = self.df2.sort_values('time') + df1 = df1.sort_values('time') + df2 = df2.sort_values('time') - self.df1['time32'] = np.int32(self.df1.time) - self.df2['time32'] = np.int32(self.df2.time) + df1['time32'] = np.int32(df1.time) + df2['time32'] = np.int32(df2.time) - self.df1a = self.df1[['time', 'value1']] - self.df2a = self.df2[['time', 'value2']] - self.df1b = self.df1[['time', 'key', 'value1']] - self.df2b = self.df2[['time', 'key', 'value2']] - self.df1c = self.df1[['time', 'key2', 'value1']] - self.df2c = self.df2[['time', 'key2', 'value2']] - self.df1d = self.df1[['time32', 'value1']] - self.df2d = self.df2[['time32', 'value2']] - self.df1e = self.df1[['time', 
'key', 'key2', 'value1']] - self.df2e = self.df2[['time', 'key', 'key2', 'value2']] + self.df1a = df1[['time', 'value1']] + self.df2a = df2[['time', 'value2']] + self.df1b = df1[['time', 'key', 'value1']] + self.df2b = df2[['time', 'key', 'value2']] + self.df1c = df1[['time', 'key2', 'value1']] + self.df2c = df2[['time', 'key2', 'value2']] + self.df1d = df1[['time32', 'value1']] + self.df2d = df2[['time32', 'value2']] + self.df1e = df1[['time', 'key', 'key2', 'value1']] + self.df2e = df2[['time', 'key', 'key2', 'value2']] - def time_noby(self): - merge_asof(self.df1a, self.df2a, on='time') + def time_on_int(self, direction): + merge_asof(self.df1a, self.df2a, on='time', direction=direction) - def time_by_object(self): - merge_asof(self.df1b, self.df2b, on='time', by='key') + def time_on_int32(self, direction): + merge_asof(self.df1d, self.df2d, on='time32', direction=direction) - def time_by_int(self): - merge_asof(self.df1c, self.df2c, on='time', by='key2') + def time_by_object(self, direction): + merge_asof(self.df1b, self.df2b, on='time', by='key', + direction=direction) - def time_on_int32(self): - merge_asof(self.df1d, self.df2d, on='time32') + def time_by_int(self, direction): + merge_asof(self.df1c, self.df2c, on='time', by='key2', + direction=direction) - def time_multiby(self): - merge_asof(self.df1e, self.df2e, on='time', by=['key', 'key2']) + def time_multiby(self, direction): + merge_asof(self.df1e, self.df2e, on='time', by=['key', 'key2'], + direction=direction) -# ---------------------------------------------------------------------- -# data alignment - class Align(object): - goal_time = 0.2 def setup(self): - self.n = 1000000 - self.sz = 500000 - self.rng = np.arange(0, 10000000000000, 10000000) - self.stamps = (np.datetime64(datetime.now()).view('i8') + self.rng) - self.idx1 = np.sort(self.sample(self.stamps, self.sz)) - self.idx2 = np.sort(self.sample(self.stamps, self.sz)) - self.ts1 = Series(np.random.randn(self.sz), self.idx1) - self.ts2 = Series(np.random.randn(self.sz), self.idx2) - - def sample(self, values, k): - self.sampler = np.random.permutation(len(values)) - return values.take(self.sampler[:k]) + size = 5 * 10**5 + rng = np.arange(0, 10**13, 10**7) + stamps = np.datetime64('now').view('i8') + rng + idx1 = np.sort(np.random.choice(stamps, size, replace=False)) + idx2 = np.sort(np.random.choice(stamps, size, replace=False)) + self.ts1 = Series(np.random.randn(size), idx1) + self.ts2 = Series(np.random.randn(size), idx2) def time_series_align_int64_index(self): - (self.ts1 + self.ts2) + self.ts1 + self.ts2 def time_series_align_left_monotonic(self): self.ts1.align(self.ts2, join='left') + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/multiindex_object.py b/asv_bench/benchmarks/multiindex_object.py new file mode 100644 index 0000000000000..adc6730dcd946 --- /dev/null +++ b/asv_bench/benchmarks/multiindex_object.py @@ -0,0 +1,129 @@ +import string + +import numpy as np +import pandas.util.testing as tm +from pandas import date_range, MultiIndex + + +class GetLoc(object): + + def setup(self): + self.mi_large = MultiIndex.from_product( + [np.arange(1000), np.arange(20), list(string.ascii_letters)], + names=['one', 'two', 'three']) + self.mi_med = MultiIndex.from_product( + [np.arange(1000), np.arange(10), list('A')], + names=['one', 'two', 'three']) + self.mi_small = MultiIndex.from_product( + [np.arange(100), list('A'), list('A')], + names=['one', 'two', 'three']) + + def time_large_get_loc(self): + self.mi_large.get_loc((999, 
19, 'Z')) + + def time_large_get_loc_warm(self): + for _ in range(1000): + self.mi_large.get_loc((999, 19, 'Z')) + + def time_med_get_loc(self): + self.mi_med.get_loc((999, 9, 'A')) + + def time_med_get_loc_warm(self): + for _ in range(1000): + self.mi_med.get_loc((999, 9, 'A')) + + def time_string_get_loc(self): + self.mi_small.get_loc((99, 'A', 'A')) + + def time_small_get_loc_warm(self): + for _ in range(1000): + self.mi_small.get_loc((99, 'A', 'A')) + + +class Duplicates(object): + + def setup(self): + size = 65536 + arrays = [np.random.randint(0, 8192, size), + np.random.randint(0, 1024, size)] + mask = np.random.rand(size) < 0.1 + self.mi_unused_levels = MultiIndex.from_arrays(arrays) + self.mi_unused_levels = self.mi_unused_levels[mask] + + def time_remove_unused_levels(self): + self.mi_unused_levels.remove_unused_levels() + + +class Integer(object): + + def setup(self): + self.mi_int = MultiIndex.from_product([np.arange(1000), + np.arange(1000)], + names=['one', 'two']) + self.obj_index = np.array([(0, 10), (0, 11), (0, 12), + (0, 13), (0, 14), (0, 15), + (0, 16), (0, 17), (0, 18), + (0, 19)], dtype=object) + + def time_get_indexer(self): + self.mi_int.get_indexer(self.obj_index) + + def time_is_monotonic(self): + self.mi_int.is_monotonic + + +class Duplicated(object): + + def setup(self): + n, k = 200, 5000 + levels = [np.arange(n), + tm.makeStringIndex(n).values, + 1000 + np.arange(n)] + codes = [np.random.choice(n, (k * n)) for lev in levels] + self.mi = MultiIndex(levels=levels, codes=codes) + + def time_duplicated(self): + self.mi.duplicated() + + +class Sortlevel(object): + + def setup(self): + n = 1182720 + low, high = -4096, 4096 + arrs = [np.repeat(np.random.randint(low, high, (n // k)), k) + for k in [11, 7, 5, 3, 1]] + self.mi_int = MultiIndex.from_arrays(arrs)[np.random.permutation(n)] + + a = np.repeat(np.arange(100), 1000) + b = np.tile(np.arange(1000), 100) + self.mi = MultiIndex.from_arrays([a, b]) + self.mi = self.mi.take(np.random.permutation(np.arange(100000))) + + def time_sortlevel_int64(self): + self.mi_int.sortlevel() + + def time_sortlevel_zero(self): + self.mi.sortlevel(0) + + def time_sortlevel_one(self): + self.mi.sortlevel(1) + + +class Values(object): + + def setup_cache(self): + + level1 = range(1000) + level2 = date_range(start='1/1/2012', periods=100) + mi = MultiIndex.from_product([level1, level2]) + return mi + + def time_datetime_level_values_copy(self, mi): + mi.copy().values + + def time_datetime_level_values_sliced(self, mi): + mi[:10].values + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/offset.py b/asv_bench/benchmarks/offset.py new file mode 100644 index 0000000000000..4570e73cccc71 --- /dev/null +++ b/asv_bench/benchmarks/offset.py @@ -0,0 +1,118 @@ +# -*- coding: utf-8 -*- +import warnings +from datetime import datetime + +import numpy as np +import pandas as pd +try: + import pandas.tseries.holiday # noqa +except ImportError: + pass + +hcal = pd.tseries.holiday.USFederalHolidayCalendar() +# These offsets currently raise a NotImplementedError with .apply_index() +non_apply = [pd.offsets.Day(), + pd.offsets.BYearEnd(), + pd.offsets.BYearBegin(), + pd.offsets.BQuarterEnd(), + pd.offsets.BQuarterBegin(), + pd.offsets.BMonthEnd(), + pd.offsets.BMonthBegin(), + pd.offsets.CustomBusinessDay(), + pd.offsets.CustomBusinessDay(calendar=hcal), + pd.offsets.CustomBusinessMonthBegin(calendar=hcal), + pd.offsets.CustomBusinessMonthEnd(calendar=hcal), + pd.offsets.CustomBusinessMonthEnd(calendar=hcal)]
+other_offsets = [pd.offsets.YearEnd(), pd.offsets.YearBegin(), + pd.offsets.QuarterEnd(), pd.offsets.QuarterBegin(), + pd.offsets.MonthEnd(), pd.offsets.MonthBegin(), + pd.offsets.DateOffset(months=2, days=2), + pd.offsets.BusinessDay(), pd.offsets.SemiMonthEnd(), + pd.offsets.SemiMonthBegin()] +offsets = non_apply + other_offsets + + +class ApplyIndex(object): + + params = other_offsets + param_names = ['offset'] + + def setup(self, offset): + N = 10000 + self.rng = pd.date_range(start='1/1/2000', periods=N, freq='T') + + def time_apply_index(self, offset): + offset.apply_index(self.rng) + + +class OnOffset(object): + + params = offsets + param_names = ['offset'] + + def setup(self, offset): + self.dates = [datetime(2016, m, d) + for m in [10, 11, 12] + for d in [1, 2, 3, 28, 29, 30, 31] + if not (m == 11 and d == 31)] + + def time_on_offset(self, offset): + for date in self.dates: + offset.onOffset(date) + + +class OffsetSeriesArithmetic(object): + + params = offsets + param_names = ['offset'] + + def setup(self, offset): + N = 1000 + rng = pd.date_range(start='1/1/2000', periods=N, freq='T') + self.data = pd.Series(rng) + + def time_add_offset(self, offset): + with warnings.catch_warnings(record=True): + self.data + offset + + +class OffsetDatetimeIndexArithmetic(object): + + params = offsets + param_names = ['offset'] + + def setup(self, offset): + N = 1000 + self.data = pd.date_range(start='1/1/2000', periods=N, freq='T') + + def time_add_offset(self, offset): + with warnings.catch_warnings(record=True): + self.data + offset + + +class OffestDatetimeArithmetic(object): + + params = offsets + param_names = ['offset'] + + def setup(self, offset): + self.date = datetime(2011, 1, 1) + self.dt64 = np.datetime64('2011-01-01 09:00Z') + + def time_apply(self, offset): + offset.apply(self.date) + + def time_apply_np_dt64(self, offset): + offset.apply(self.dt64) + + def time_add(self, offset): + self.date + offset + + def time_add_10(self, offset): + self.date + (10 * offset) + + def time_subtract(self, offset): + self.date - offset + + def time_subtract_10(self, offset): + self.date - (10 * offset) diff --git a/asv_bench/benchmarks/packers.py b/asv_bench/benchmarks/packers.py deleted file mode 100644 index cd43e305ead8f..0000000000000 --- a/asv_bench/benchmarks/packers.py +++ /dev/null @@ -1,316 +0,0 @@ -from .pandas_vb_common import * -from numpy.random import randint -import pandas as pd -from collections import OrderedDict -from pandas.compat import BytesIO -import sqlite3 -import os -from sqlalchemy import create_engine -import numpy as np -from random import randrange - -class _Packers(object): - goal_time = 0.2 - - def _setup(self): - self.f = '__test__.msg' - self.N = 100000 - self.C = 5 - self.index = date_range('20000101', periods=self.N, freq='H') - self.df = DataFrame(dict([('float{0}'.format(i), randn(self.N)) for i in range(self.C)]), index=self.index) - self.df2 = self.df.copy() - self.df2['object'] = [('%08x' % randrange((16 ** 8))) for _ in range(self.N)] - self.remove(self.f) - - def remove(self, f): - try: - os.remove(self.f) - except: - pass - -class Packers(_Packers): - goal_time = 0.2 - - def setup(self): - self._setup() - self.df.to_csv(self.f) - - def time_packers_read_csv(self): - pd.read_csv(self.f) - -class packers_read_excel(_Packers): - goal_time = 0.2 - - def setup(self): - self._setup() - self.bio = BytesIO() - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='xlsxwriter') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def 
time_packers_read_excel(self): - self.bio.seek(0) - pd.read_excel(self.bio) - - -class packers_read_hdf_store(_Packers): - goal_time = 0.2 - - def setup(self): - self._setup() - self.df2.to_hdf(self.f, 'df') - - def time_packers_read_hdf_store(self): - pd.read_hdf(self.f, 'df') - - -class packers_read_hdf_table(_Packers): - - def setup(self): - self._setup() - self.df2.to_hdf(self.f, 'df', format='table') - - def time_packers_read_hdf_table(self): - pd.read_hdf(self.f, 'df') - - -class packers_read_json(_Packers): - - def setup(self): - self._setup() - self.df.to_json(self.f, orient='split') - self.df.index = np.arange(self.N) - - def time_packers_read_json(self): - pd.read_json(self.f, orient='split') - - -class packers_read_json_date_index(_Packers): - - def setup(self): - self._setup() - self.remove(self.f) - self.df.to_json(self.f, orient='split') - - def time_packers_read_json_date_index(self): - pd.read_json(self.f, orient='split') - - -class packers_read_pack(_Packers): - - def setup(self): - self._setup() - self.df2.to_msgpack(self.f) - - def time_packers_read_pack(self): - pd.read_msgpack(self.f) - - -class packers_read_pickle(_Packers): - - def setup(self): - self._setup() - self.df2.to_pickle(self.f) - - def time_packers_read_pickle(self): - pd.read_pickle(self.f) - -class packers_read_sql(_Packers): - - def setup(self): - self._setup() - self.engine = create_engine('sqlite:///:memory:') - self.df2.to_sql('table', self.engine, if_exists='replace') - - def time_packers_read_sql(self): - pd.read_sql_table('table', self.engine) - - -class packers_read_stata(_Packers): - - def setup(self): - self._setup() - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_packers_read_stata(self): - pd.read_stata(self.f) - - -class packers_read_stata_with_validation(_Packers): - - def setup(self): - self._setup() - self.df['int8_'] = [randint(np.iinfo(np.int8).min, (np.iinfo(np.int8).max - 27)) for _ in range(self.N)] - self.df['int16_'] = [randint(np.iinfo(np.int16).min, (np.iinfo(np.int16).max - 27)) for _ in range(self.N)] - self.df['int32_'] = [randint(np.iinfo(np.int32).min, (np.iinfo(np.int32).max - 27)) for _ in range(self.N)] - self.df['float32_'] = np.array(randn(self.N), dtype=np.float32) - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_packers_read_stata_with_validation(self): - pd.read_stata(self.f) - - -class packers_read_sas(_Packers): - - def setup(self): - self.f = os.path.join(os.path.dirname(__file__), '..', '..', - 'pandas', 'io', 'tests', 'sas', 'data', - 'test1.sas7bdat') - self.f2 = os.path.join(os.path.dirname(__file__), '..', '..', - 'pandas', 'io', 'tests', 'sas', 'data', - 'paxraw_d_short.xpt') - - def time_read_sas7bdat(self): - pd.read_sas(self.f, format='sas7bdat') - - def time_read_xport(self): - pd.read_sas(self.f, format='xport') - - -class CSV(_Packers): - - def setup(self): - self._setup() - - def time_write_csv(self): - self.df.to_csv(self.f) - - def teardown(self): - self.remove(self.f) - - -class Excel(_Packers): - - def setup(self): - self._setup() - self.bio = BytesIO() - - def time_write_excel_openpyxl(self): - self.bio.seek(0) - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='openpyxl') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def time_write_excel_xlsxwriter(self): - self.bio.seek(0) - self.writer = pd.io.excel.ExcelWriter(self.bio, engine='xlsxwriter') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - def time_write_excel_xlwt(self): - self.bio.seek(0) - self.writer = 
pd.io.excel.ExcelWriter(self.bio, engine='xlwt') - self.df[:2000].to_excel(self.writer) - self.writer.save() - - -class HDF(_Packers): - - def setup(self): - self._setup() - - def time_write_hdf_store(self): - self.df2.to_hdf(self.f, 'df') - - def time_write_hdf_table(self): - self.df2.to_hdf(self.f, 'df', table=True) - - def teardown(self): - self.remove(self.f) - -class JSON(_Packers): - - def setup(self): - self._setup() - self.df_date = self.df.copy() - self.df.index = np.arange(self.N) - self.cols = [(lambda i: ('{0}_timedelta'.format(i), [pd.Timedelta(('%d seconds' % randrange(1000000.0))) for _ in range(self.N)])), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N))), (lambda i: ('{0}_timestamp'.format(i), [pd.Timestamp((1418842918083256000 + randrange(1000000000.0, 1e+18, 200))) for _ in range(self.N)]))] - self.df_mixed = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - self.cols = [(lambda i: ('{0}_float'.format(i), randn(self.N))), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N)))] - self.df_mixed2 = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - self.cols = [(lambda i: ('{0}_float'.format(i), randn(self.N))), (lambda i: ('{0}_int'.format(i), randint(100000000.0, size=self.N))), (lambda i: ('{0}_str'.format(i), [('%08x' % randrange((16 ** 8))) for _ in range(self.N)]))] - self.df_mixed3 = DataFrame(OrderedDict([self.cols[(i % len(self.cols))](i) for i in range(self.C)]), index=self.index) - - def time_write_json(self): - self.df.to_json(self.f, orient='split') - - def time_write_json_T(self): - self.df.to_json(self.f, orient='columns') - - def time_write_json_date_index(self): - self.df_date.to_json(self.f, orient='split') - - def time_write_json_mixed_delta_int_tstamp(self): - self.df_mixed.to_json(self.f, orient='split') - - def time_write_json_mixed_float_int(self): - self.df_mixed2.to_json(self.f, orient='index') - - def time_write_json_mixed_float_int_T(self): - self.df_mixed2.to_json(self.f, orient='columns') - - def time_write_json_mixed_float_int_str(self): - self.df_mixed3.to_json(self.f, orient='split') - - def time_write_json_lines(self): - self.df.to_json(self.f, orient="records", lines=True) - - def teardown(self): - self.remove(self.f) - - -class MsgPack(_Packers): - - def setup(self): - self._setup() - - def time_write_msgpack(self): - self.df2.to_msgpack(self.f) - - def teardown(self): - self.remove(self.f) - - -class Pickle(_Packers): - - def setup(self): - self._setup() - - def time_write_pickle(self): - self.df2.to_pickle(self.f) - - def teardown(self): - self.remove(self.f) - - -class SQL(_Packers): - - def setup(self): - self._setup() - self.engine = create_engine('sqlite:///:memory:') - - def time_write_sql(self): - self.df2.to_sql('table', self.engine, if_exists='replace') - - -class STATA(_Packers): - - def setup(self): - self._setup() - - self.df3=self.df.copy() - self.df3['int8_'] = [randint(np.iinfo(np.int8).min, (np.iinfo(np.int8).max - 27)) for _ in range(self.N)] - self.df3['int16_'] = [randint(np.iinfo(np.int16).min, (np.iinfo(np.int16).max - 27)) for _ in range(self.N)] - self.df3['int32_'] = [randint(np.iinfo(np.int32).min, (np.iinfo(np.int32).max - 27)) for _ in range(self.N)] - self.df3['float32_'] = np.array(randn(self.N), dtype=np.float32) - - def time_write_stata(self): - self.df.to_stata(self.f, {'index': 'tc', }) - - def time_write_stata_with_validation(self): - self.df3.to_stata(self.f, 
{'index': 'tc', }) - - def teardown(self): - self.remove(self.f) diff --git a/asv_bench/benchmarks/pandas_vb_common.py b/asv_bench/benchmarks/pandas_vb_common.py index 56ccc94c414fb..d479952cbfbf6 100644 --- a/asv_bench/benchmarks/pandas_vb_common.py +++ b/asv_bench/benchmarks/pandas_vb_common.py @@ -1,37 +1,55 @@ -from pandas import * -import pandas as pd -from datetime import timedelta -from numpy.random import randn -from numpy.random import randint -from numpy.random import permutation -import pandas.util.testing as tm -import random -import numpy as np -import threading +import os from importlib import import_module -try: - from pandas.compat import range -except ImportError: - pass - -np.random.seed(1234) +import numpy as np +import pandas as pd -# try em until it works! -for imp in ['pandas_tseries', 'pandas.lib', 'pandas._libs.lib']: +# Compatibility import for lib +for imp in ['pandas._libs.lib', 'pandas.lib']: try: lib = import_module(imp) break - except: + except (ImportError, TypeError, ValueError): pass +numeric_dtypes = [np.int64, np.int32, np.uint32, np.uint64, np.float32, + np.float64, np.int16, np.int8, np.uint16, np.uint8] +datetime_dtypes = [np.datetime64, np.timedelta64] +string_dtypes = [np.object] try: - Panel = Panel -except Exception: - Panel = WidePanel + extension_dtypes = [pd.Int8Dtype, pd.Int16Dtype, + pd.Int32Dtype, pd.Int64Dtype, + pd.UInt8Dtype, pd.UInt16Dtype, + pd.UInt32Dtype, pd.UInt64Dtype, + pd.CategoricalDtype, + pd.IntervalDtype, + pd.DatetimeTZDtype('ns', 'UTC'), + pd.PeriodDtype('D')] +except AttributeError: + extension_dtypes = [] -# didn't add to namespace until later -try: - from pandas.core.index import MultiIndex -except ImportError: - pass + +def setup(*args, **kwargs): + # This function just needs to be imported into each benchmark file to + # set up the random seed before each function. 
+ # http://asv.readthedocs.io/en/latest/writing_benchmarks.html + np.random.seed(1234) + + +class BaseIO(object): + """ + Base class for IO benchmarks + """ + fname = None + + def remove(self, f): + """Remove created files""" + try: + os.remove(f) + except OSError: + # On Windows, attempting to remove a file that is in use + # causes an exception to be raised + pass + + def teardown(self, *args, **kwargs): + self.remove(self.fname) diff --git a/asv_bench/benchmarks/panel_ctor.py b/asv_bench/benchmarks/panel_ctor.py index faedce6c574ec..627705284481b 100644 --- a/asv_bench/benchmarks/panel_ctor.py +++ b/asv_bench/benchmarks/panel_ctor.py @@ -1,64 +1,55 @@ -from .pandas_vb_common import * +import warnings +from datetime import datetime, timedelta +from pandas import DataFrame, Panel, date_range -class Constructors1(object): - goal_time = 0.2 +class DifferentIndexes(object): def setup(self): self.data_frames = {} - self.start = datetime(1990, 1, 1) - self.end = datetime(2012, 1, 1) + start = datetime(1990, 1, 1) + end = datetime(2012, 1, 1) for x in range(100): - self.end += timedelta(days=1) - self.dr = np.asarray(date_range(self.start, self.end)) - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df + end += timedelta(days=1) + idx = date_range(start, end) + df = DataFrame({'a': 0, 'b': 1, 'c': 2}, index=idx) + self.data_frames[x] = df - def time_panel_from_dict_all_different_indexes(self): - Panel.from_dict(self.data_frames) + def time_from_dict(self): + with warnings.catch_warnings(record=True): + Panel.from_dict(self.data_frames) -class Constructors2(object): - goal_time = 0.2 +class SameIndexes(object): def setup(self): - self.data_frames = {} - for x in range(100): - self.dr = np.asarray(DatetimeIndex(start=datetime(1990, 1, 1), end=datetime(2012, 1, 1), freq=datetools.Day(1))) - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df - - def time_panel_from_dict_equiv_indexes(self): - Panel.from_dict(self.data_frames) - - -class Constructors3(object): - goal_time = 0.2 - - def setup(self): - self.dr = np.asarray(DatetimeIndex(start=datetime(1990, 1, 1), end=datetime(2012, 1, 1), freq=datetools.Day(1))) - self.data_frames = {} - for x in range(100): - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df + idx = date_range(start=datetime(1990, 1, 1), + end=datetime(2012, 1, 1), + freq='D') + df = DataFrame({'a': 0, 'b': 1, 'c': 2}, index=idx) + self.data_frames = dict(enumerate([df] * 100)) - def time_panel_from_dict_same_index(self): - Panel.from_dict(self.data_frames) + def time_from_dict(self): + with warnings.catch_warnings(record=True): + Panel.from_dict(self.data_frames) -class Constructors4(object): - goal_time = 0.2 +class TwoIndexes(object): def setup(self): - self.data_frames = {} - self.start = datetime(1990, 1, 1) - self.end = datetime(2012, 1, 1) - for x in range(100): - if (x == 50): - self.end += timedelta(days=1) - self.dr = np.asarray(date_range(self.start, self.end)) - self.df = DataFrame({'a': ([0] * len(self.dr)), 'b': ([1] * len(self.dr)), 'c': ([2] * len(self.dr)), }, index=self.dr) - self.data_frames[x] = self.df - - def time_panel_from_dict_two_different_indexes(self): - Panel.from_dict(self.data_frames) + start = datetime(1990, 1, 1) + end = datetime(2012, 1, 1) + df1 = 
DataFrame({'a': 0, 'b': 1, 'c': 2}, + index=date_range(start=start, end=end, freq='D')) + end += timedelta(days=1) + df2 = DataFrame({'a': 0, 'b': 1, 'c': 2}, + index=date_range(start=start, end=end, freq='D')) + dfs = [df1] * 50 + [df2] * 50 + self.data_frames = dict(enumerate(dfs)) + + def time_from_dict(self): + with warnings.catch_warnings(record=True): + Panel.from_dict(self.data_frames) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/panel_methods.py b/asv_bench/benchmarks/panel_methods.py index 6609305502011..a4c12c082236e 100644 --- a/asv_bench/benchmarks/panel_methods.py +++ b/asv_bench/benchmarks/panel_methods.py @@ -1,24 +1,25 @@ -from .pandas_vb_common import * +import warnings + +import numpy as np +from pandas import Panel class PanelMethods(object): - goal_time = 0.2 - def setup(self): - self.index = date_range(start='2000', freq='D', periods=1000) - self.panel = Panel(np.random.randn(100, len(self.index), 1000)) + params = ['items', 'major', 'minor'] + param_names = ['axis'] - def time_pct_change_items(self): - self.panel.pct_change(1, axis='items') + def setup(self, axis): + with warnings.catch_warnings(record=True): + self.panel = Panel(np.random.randn(100, 1000, 100)) - def time_pct_change_major(self): - self.panel.pct_change(1, axis='major') + def time_pct_change(self, axis): + with warnings.catch_warnings(record=True): + self.panel.pct_change(1, axis=axis) - def time_pct_change_minor(self): - self.panel.pct_change(1, axis='minor') + def time_shift(self, axis): + with warnings.catch_warnings(record=True): + self.panel.shift(1, axis=axis) - def time_shift(self): - self.panel.shift(1) - def time_shift_minor(self): - self.panel.shift(1, axis='minor') +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/parser_vb.py b/asv_bench/benchmarks/parser_vb.py deleted file mode 100644 index 32bf7e50d1a89..0000000000000 --- a/asv_bench/benchmarks/parser_vb.py +++ /dev/null @@ -1,121 +0,0 @@ -from .pandas_vb_common import * -import os -from pandas import read_csv -try: - from cStringIO import StringIO -except ImportError: - from io import StringIO - - -class read_csv1(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 8 - self.df = DataFrame((np.random.randn(self.N, self.K) * np.random.randint(100, 10000, (self.N, self.K)))) - self.df.to_csv('test.csv', sep='|') - - self.format = (lambda x: '{:,}'.format(x)) - self.df2 = self.df.applymap(self.format) - self.df2.to_csv('test2.csv', sep='|') - - def time_sep(self): - read_csv('test.csv', sep='|') - - def time_thousands(self): - read_csv('test.csv', sep='|', thousands=',') - - def teardown(self): - os.remove('test.csv') - os.remove('test2.csv') - - -class read_csv2(object): - goal_time = 0.2 - - def setup(self): - self.data = ['A,B,C'] - self.data = (self.data + (['1,2,3 # comment'] * 100000)) - self.data = '\n'.join(self.data) - - def time_comment(self): - read_csv(StringIO(self.data), comment='#') - - -class read_csv3(object): - goal_time = 0.2 - - def setup(self): - self.data = """0.1213700904466425978256438611,0.0525708283766902484401839501,0.4174092731488769913994474336\n -0.4096341697147408700274695547,0.1587830198973579909349496119,0.1292545832485494372576795285\n -0.8323255650024565799327547210,0.9694902427379478160318626578,0.6295047811546814475747169126\n -0.4679375305798131323697930383,0.2963942381834381301075609371,0.5268936082160610157032465394\n 
-0.6685382761849776311890991564,0.6721207066140679753374342908,0.6519975277021627935170045020\n""" - self.data2 = self.data.replace(',', ';').replace('.', ',') - self.data = (self.data * 200) - self.data2 = (self.data2 * 200) - - def time_default_converter(self): - read_csv(StringIO(self.data), sep=',', header=None, - float_precision=None) - - def time_default_converter_with_decimal(self): - read_csv(StringIO(self.data2), sep=';', header=None, - float_precision=None, decimal=',') - - def time_default_converter_python_engine(self): - read_csv(StringIO(self.data), sep=',', header=None, - float_precision=None, engine='python') - - def time_default_converter_with_decimal_python_engine(self): - read_csv(StringIO(self.data2), sep=';', header=None, - float_precision=None, decimal=',', engine='python') - - def time_precise_converter(self): - read_csv(StringIO(self.data), sep=',', header=None, - float_precision='high') - - def time_roundtrip_converter(self): - read_csv(StringIO(self.data), sep=',', header=None, - float_precision='round_trip') - - -class read_csv_categorical(object): - goal_time = 0.2 - - def setup(self): - N = 100000 - group1 = ['aaaaaaaa', 'bbbbbbb', 'cccccccc', 'dddddddd', 'eeeeeeee'] - df = DataFrame({'a': np.random.choice(group1, N).astype('object'), - 'b': np.random.choice(group1, N).astype('object'), - 'c': np.random.choice(group1, N).astype('object')}) - df.to_csv('strings.csv', index=False) - - def time_convert_post(self): - read_csv('strings.csv').apply(pd.Categorical) - - def time_convert_direct(self): - read_csv('strings.csv', dtype='category') - - def teardown(self): - os.remove('strings.csv') - - -class read_csv_dateparsing(object): - goal_time = 0.2 - - def setup(self): - self.N = 10000 - self.K = 8 - self.data = 'KORD,19990127, 19:00:00, 18:56:00, 0.8100, 2.8100, 7.2000, 0.0000, 280.0000\n KORD,19990127, 20:00:00, 19:56:00, 0.0100, 2.2100, 7.2000, 0.0000, 260.0000\n KORD,19990127, 21:00:00, 20:56:00, -0.5900, 2.2100, 5.7000, 0.0000, 280.0000\n KORD,19990127, 21:00:00, 21:18:00, -0.9900, 2.0100, 3.6000, 0.0000, 270.0000\n KORD,19990127, 22:00:00, 21:56:00, -0.5900, 1.7100, 5.1000, 0.0000, 290.0000\n ' - self.data = (self.data * 200) - self.data2 = 'KORD,19990127 19:00:00, 18:56:00, 0.8100, 2.8100, 7.2000, 0.0000, 280.0000\n KORD,19990127 20:00:00, 19:56:00, 0.0100, 2.2100, 7.2000, 0.0000, 260.0000\n KORD,19990127 21:00:00, 20:56:00, -0.5900, 2.2100, 5.7000, 0.0000, 280.0000\n KORD,19990127 21:00:00, 21:18:00, -0.9900, 2.0100, 3.6000, 0.0000, 270.0000\n KORD,19990127 22:00:00, 21:56:00, -0.5900, 1.7100, 5.1000, 0.0000, 290.0000\n ' - self.data2 = (self.data2 * 200) - - def time_multiple_date(self): - read_csv(StringIO(self.data), sep=',', header=None, - parse_dates=[[1, 2], [1, 3]]) - - def time_baseline(self): - read_csv(StringIO(self.data2), sep=',', header=None, parse_dates=[1]) diff --git a/asv_bench/benchmarks/period.py b/asv_bench/benchmarks/period.py index f9837191a7bae..6d2c7156a0a3d 100644 --- a/asv_bench/benchmarks/period.py +++ b/asv_bench/benchmarks/period.py @@ -1,59 +1,124 @@ -import pandas as pd -from pandas import Series, Period, PeriodIndex, date_range +from pandas import ( + DataFrame, Period, PeriodIndex, Series, date_range, period_range) +from pandas.tseries.frequencies import to_offset -class Constructor(object): - goal_time = 0.2 +class PeriodProperties(object): - def setup(self): + params = (['M', 'min'], + ['year', 'month', 'day', 'hour', 'minute', 'second', + 'is_leap_year', 'quarter', 'qyear', 'week', 'daysinmonth', + 'dayofweek', 'dayofyear', 
'start_time', 'end_time']) + param_names = ['freq', 'attr'] + + def setup(self, freq, attr): + self.per = Period('2012-06-01', freq=freq) + + def time_property(self, freq, attr): + getattr(self.per, attr) + + +class PeriodUnaryMethods(object): + + params = ['M', 'min'] + param_names = ['freq'] + + def setup(self, freq): + self.per = Period('2012-06-01', freq=freq) + + def time_to_timestamp(self, freq): + self.per.to_timestamp() + + def time_now(self, freq): + self.per.now(freq) + + def time_asfreq(self, freq): + self.per.asfreq('A') + + +class PeriodConstructor(object): + params = [['D'], [True, False]] + param_names = ['freq', 'is_offset'] + + def setup(self, freq, is_offset): + if is_offset: + self.freq = to_offset(freq) + else: + self.freq = freq + + def time_period_constructor(self, freq, is_offset): + Period('2012-06-01', freq=freq) + + +class PeriodIndexConstructor(object): + + params = [['D'], [True, False]] + param_names = ['freq', 'is_offset'] + + def setup(self, freq, is_offset): self.rng = date_range('1985', periods=1000) self.rng2 = date_range('1985', periods=1000).to_pydatetime() + self.ints = list(range(2000, 3000)) + self.daily_ints = date_range('1/1/2000', periods=1000, + freq=freq).strftime('%Y%m%d').map(int) + if is_offset: + self.freq = to_offset(freq) + else: + self.freq = freq + + def time_from_date_range(self, freq, is_offset): + PeriodIndex(self.rng, freq=freq) - def time_from_date_range(self): - PeriodIndex(self.rng, freq='D') + def time_from_pydatetime(self, freq, is_offset): + PeriodIndex(self.rng2, freq=freq) - def time_from_pydatetime(self): - PeriodIndex(self.rng2, freq='D') + def time_from_ints(self, freq, is_offset): + PeriodIndex(self.ints, freq=freq) + def time_from_ints_daily(self, freq, is_offset): + PeriodIndex(self.daily_ints, freq=freq) -class DataFrame(object): - goal_time = 0.2 + +class DataFramePeriodColumn(object): def setup(self): - self.rng = pd.period_range(start='1/1/1990', freq='S', periods=20000) - self.df = pd.DataFrame(index=range(len(self.rng))) + self.rng = period_range(start='1/1/1990', freq='S', periods=20000) + self.df = DataFrame(index=range(len(self.rng))) def time_setitem_period_column(self): self.df['col'] = self.rng + def time_set_index(self): + # GH#21582 limited by comparisons of Period objects + self.df['col2'] = self.rng + self.df.set_index('col2', append=True) + class Algorithms(object): - goal_time = 0.2 - def setup(self): + params = ['index', 'series'] + param_names = ['typ'] + + def setup(self, typ): data = [Period('2011-01', freq='M'), Period('2011-02', freq='M'), Period('2011-03', freq='M'), Period('2011-04', freq='M')] - self.s = Series(data * 1000) - self.i = PeriodIndex(data, freq='M') - - def time_drop_duplicates_pseries(self): - self.s.drop_duplicates() - def time_drop_duplicates_pindex(self): - self.i.drop_duplicates() + if typ == 'index': + self.vector = PeriodIndex(data * 1000, freq='M') + elif typ == 'series': + self.vector = Series(data * 1000) - def time_value_counts_pseries(self): - self.s.value_counts() + def time_drop_duplicates(self, typ): + self.vector.drop_duplicates() - def time_value_counts_pindex(self): - self.i.value_counts() + def time_value_counts(self, typ): + self.vector.value_counts() -class period_standard_indexing(object): - goal_time = 0.2 +class Indexing(object): def setup(self): - self.index = PeriodIndex(start='1985', periods=1000, freq='D') + self.index = period_range(start='1985', periods=1000, freq='D') self.series = Series(range(1000), index=self.index) self.period = self.index[500] @@ 
-70,7 +135,10 @@ def time_series_loc(self): self.series.loc[self.period] def time_align(self): - pd.DataFrame({'a': self.series, 'b': self.series[:500]}) + DataFrame({'a': self.series, 'b': self.series[:500]}) def time_intersection(self): self.index[:750].intersection(self.index[250:]) + + def time_unique(self): + self.index.unique() diff --git a/asv_bench/benchmarks/plotting.py b/asv_bench/benchmarks/plotting.py index 757c3e27dd333..8a67af0bdabd1 100644 --- a/asv_bench/benchmarks/plotting.py +++ b/asv_bench/benchmarks/plotting.py @@ -1,21 +1,69 @@ -from .pandas_vb_common import * +import numpy as np +from pandas import DataFrame, Series, DatetimeIndex, date_range try: - from pandas import date_range + from pandas.plotting import andrews_curves except ImportError: - def date_range(start=None, end=None, periods=None, freq=None): - return DatetimeIndex(start, end, periods=periods, offset=freq) -from pandas.tools.plotting import andrews_curves + from pandas.tools.plotting import andrews_curves +import matplotlib +matplotlib.use('Agg') + + +class SeriesPlotting(object): + params = [['line', 'bar', 'area', 'barh', 'hist', 'kde', 'pie']] + param_names = ['kind'] + + def setup(self, kind): + if kind in ['bar', 'barh', 'pie']: + n = 100 + elif kind in ['kde']: + n = 10000 + else: + n = 1000000 + + self.s = Series(np.random.randn(n)) + if kind in ['area', 'pie']: + self.s = self.s.abs() + + def time_series_plot(self, kind): + self.s.plot(kind=kind) + + +class FramePlotting(object): + params = [['line', 'bar', 'area', 'barh', 'hist', 'kde', 'pie', 'scatter', + 'hexbin']] + param_names = ['kind'] + + def setup(self, kind): + if kind in ['bar', 'barh', 'pie']: + n = 100 + elif kind in ['kde', 'scatter', 'hexbin']: + n = 10000 + else: + n = 1000000 + + self.x = Series(np.random.randn(n)) + self.y = Series(np.random.randn(n)) + if kind in ['area', 'pie']: + self.x = self.x.abs() + self.y = self.y.abs() + self.df = DataFrame({'x': self.x, 'y': self.y}) + + def time_frame_plot(self, kind): + self.df.plot(x='x', y='y', kind=kind) class TimeseriesPlotting(object): - goal_time = 0.2 def setup(self): - import matplotlib - matplotlib.use('Agg') - self.N = 2000 - self.M = 5 - self.df = DataFrame(np.random.randn(self.N, self.M), index=date_range('1/1/1975', periods=self.N)) + N = 2000 + M = 5 + idx = date_range('1/1/1975', periods=N) + self.df = DataFrame(np.random.randn(N, M), index=idx) + + idx_irregular = DatetimeIndex(np.concatenate((idx.values[0:10], + idx.values[12:]))) + self.df2 = DataFrame(np.random.randn(len(idx_irregular), M), + index=idx_irregular) def time_plot_regular(self): self.df.plot() @@ -23,18 +71,23 @@ def time_plot_regular(self): def time_plot_regular_compat(self): self.df.plot(x_compat=True) + def time_plot_irregular(self): + self.df2.plot() + + def time_plot_table(self): + self.df.plot(table=True) + class Misc(object): - goal_time = 0.6 def setup(self): - import matplotlib - matplotlib.use('Agg') - self.N = 500 - self.M = 10 - data_dict = {x: np.random.randn(self.N) for x in range(self.M)} - data_dict["Name"] = ["A"] * self.N - self.df = DataFrame(data_dict) + N = 500 + M = 10 + self.df = DataFrame(np.random.randn(N, M)) + self.df['Name'] = ["A"] * N def time_plot_andrews_curves(self): andrews_curves(self.df, "Name") + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/reindex.py b/asv_bench/benchmarks/reindex.py index 537d275e7c727..3080b34024a33 100644 --- a/asv_bench/benchmarks/reindex.py +++ b/asv_bench/benchmarks/reindex.py @@ -1,98 +1,79 @@ -from 
.pandas_vb_common import * -from random import shuffle +import numpy as np +import pandas.util.testing as tm +from pandas import (DataFrame, Series, MultiIndex, Index, date_range, + period_range) +from .pandas_vb_common import lib -class Reindexing(object): - goal_time = 0.2 +class Reindex(object): def setup(self): - self.rng = DatetimeIndex(start='1/1/1970', periods=10000, freq='1min') - self.df = DataFrame(np.random.rand(10000, 10), index=self.rng, + rng = date_range(start='1/1/1970', periods=10000, freq='1min') + self.df = DataFrame(np.random.rand(10000, 10), index=rng, columns=range(10)) self.df['foo'] = 'bar' - self.rng2 = Index(self.rng[::2]) - + self.rng_subset = Index(rng[::2]) self.df2 = DataFrame(index=range(10000), data=np.random.rand(10000, 30), columns=range(30)) - - # multi-index N = 5000 K = 200 level1 = tm.makeStringIndex(N).values.repeat(K) level2 = np.tile(tm.makeStringIndex(K).values, N) index = MultiIndex.from_arrays([level1, level2]) - self.s1 = Series(np.random.randn((N * K)), index=index) - self.s2 = self.s1[::2] + self.s = Series(np.random.randn(N * K), index=index) + self.s_subset = self.s[::2] def time_reindex_dates(self): - self.df.reindex(self.rng2) + self.df.reindex(self.rng_subset) def time_reindex_columns(self): self.df2.reindex(columns=self.df.columns[1:5]) def time_reindex_multiindex(self): - self.s1.reindex(self.s2.index) - + self.s.reindex(self.s_subset.index) -#---------------------------------------------------------------------- -# Pad / backfill +class ReindexMethod(object): -class FillMethod(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range('1/1/2000', periods=100000, freq='1min') - self.ts = Series(np.random.randn(len(self.rng)), index=self.rng) - self.ts2 = self.ts[::2] - self.ts3 = self.ts2.reindex(self.ts.index) - self.ts4 = self.ts3.astype('float32') + params = [['pad', 'backfill'], [date_range, period_range]] + param_names = ['method', 'constructor'] - def pad(self, source_series, target_index): - try: - source_series.reindex(target_index, method='pad') - except: - source_series.reindex(target_index, fillMethod='pad') + def setup(self, method, constructor): + N = 100000 + self.idx = constructor('1/1/2000', periods=N, freq='1min') + self.ts = Series(np.random.randn(N), index=self.idx)[::2] - def backfill(self, source_series, target_index): - try: - source_series.reindex(target_index, method='backfill') - except: - source_series.reindex(target_index, fillMethod='backfill') + def time_reindex_method(self, method, constructor): + self.ts.reindex(self.idx, method=method) - def time_backfill_dates(self): - self.backfill(self.ts2, self.ts.index) - def time_pad_daterange(self): - self.pad(self.ts2, self.ts.index) +class Fillna(object): - def time_backfill(self): - self.ts3.fillna(method='backfill') + params = ['pad', 'backfill'] + param_names = ['method'] - def time_backfill_float32(self): - self.ts4.fillna(method='backfill') + def setup(self, method): + N = 100000 + self.idx = date_range('1/1/2000', periods=N, freq='1min') + ts = Series(np.random.randn(N), index=self.idx)[::2] + self.ts_reindexed = ts.reindex(self.idx) + self.ts_float32 = self.ts_reindexed.astype('float32') - def time_pad(self): - self.ts3.fillna(method='pad') + def time_reindexed(self, method): + self.ts_reindexed.fillna(method=method) - def time_pad_float32(self): - self.ts4.fillna(method='pad') - - -#---------------------------------------------------------------------- -# align on level + def time_float_32(self, method): + 
self.ts_float32.fillna(method=method) class LevelAlign(object): - goal_time = 0.2 def setup(self): self.index = MultiIndex( levels=[np.arange(10), np.arange(100), np.arange(100)], - labels=[np.arange(10).repeat(10000), - np.tile(np.arange(100).repeat(100), 10), - np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) + codes=[np.arange(10).repeat(10000), + np.tile(np.arange(100).repeat(100), 10), + np.tile(np.tile(np.arange(100), 100), 10)]) self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) self.df_level = DataFrame(np.random.randn(100, 4), @@ -102,106 +83,82 @@ def time_align_level(self): self.df.align(self.df_level, level=1, copy=False) def time_reindex_level(self): - self.df_level.reindex(self.df.index, level=1) - - -#---------------------------------------------------------------------- -# drop_duplicates + self.df_level.reindex(self.index, level=1) -class Duplicates(object): - goal_time = 0.2 +class DropDuplicates(object): - def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, - 'value': np.random.randn((self.N * self.K)),}) - self.col_array_list = list(self.df.values.T) + params = [True, False] + param_names = ['inplace'] - self.df2 = self.df.copy() - self.df2.ix[:10000, :] = np.nan + def setup(self, inplace): + N = 10000 + K = 10 + key1 = tm.makeStringIndex(N).values.repeat(K) + key2 = tm.makeStringIndex(N).values.repeat(K) + self.df = DataFrame({'key1': key1, 'key2': key2, + 'value': np.random.randn(N * K)}) + self.df_nan = self.df.copy() + self.df_nan.iloc[:10000, :] = np.nan self.s = Series(np.random.randint(0, 1000, size=10000)) - self.s2 = Series(np.tile(tm.makeStringIndex(1000).values, 10)) - - np.random.seed(1234) - self.N = 1000000 - self.K = 10000 - self.key1 = np.random.randint(0, self.K, size=self.N) - self.df_int = DataFrame({'key1': self.key1}) - self.df_bool = DataFrame({i: np.random.randint(0, 2, size=self.K, - dtype=bool) - for i in range(10)}) - - def time_frame_drop_dups(self): - self.df.drop_duplicates(['key1', 'key2']) + self.s_str = Series(np.tile(tm.makeStringIndex(1000).values, 10)) - def time_frame_drop_dups_inplace(self): - self.df.drop_duplicates(['key1', 'key2'], inplace=True) + N = 1000000 + K = 10000 + key1 = np.random.randint(0, K, size=N) + self.df_int = DataFrame({'key1': key1}) + self.df_bool = DataFrame(np.random.randint(0, 2, size=(K, 10), + dtype=bool)) - def time_frame_drop_dups_na(self): - self.df2.drop_duplicates(['key1', 'key2']) + def time_frame_drop_dups(self, inplace): + self.df.drop_duplicates(['key1', 'key2'], inplace=inplace) - def time_frame_drop_dups_na_inplace(self): - self.df2.drop_duplicates(['key1', 'key2'], inplace=True) + def time_frame_drop_dups_na(self, inplace): + self.df_nan.drop_duplicates(['key1', 'key2'], inplace=inplace) - def time_series_drop_dups_int(self): - self.s.drop_duplicates() + def time_series_drop_dups_int(self, inplace): + self.s.drop_duplicates(inplace=inplace) - def time_series_drop_dups_string(self): - self.s2.drop_duplicates() + def time_series_drop_dups_string(self, inplace): + self.s_str.drop_duplicates(inplace=inplace) - def time_frame_drop_dups_int(self): - self.df_int.drop_duplicates() + def time_frame_drop_dups_int(self, inplace): + self.df_int.drop_duplicates(inplace=inplace) - def time_frame_drop_dups_bool(self): - self.df_bool.drop_duplicates() - 
-#---------------------------------------------------------------------- -# blog "pandas escaped the zoo" + def time_frame_drop_dups_bool(self, inplace): + self.df_bool.drop_duplicates(inplace=inplace) class Align(object): - goal_time = 0.2 - + # blog "pandas escaped the zoo" def setup(self): n = 50000 indices = tm.makeStringIndex(n) subsample_size = 40000 - - def sample(values, k): - sampler = np.arange(len(values)) - shuffle(sampler) - return values.take(sampler[:k]) - - self.x = Series(np.random.randn(50000), indices) + self.x = Series(np.random.randn(n), indices) self.y = Series(np.random.randn(subsample_size), - index=sample(indices, subsample_size)) + index=np.random.choice(indices, subsample_size, + replace=False)) def time_align_series_irregular_string(self): - (self.x + self.y) + self.x + self.y class LibFastZip(object): - goal_time = 0.2 def setup(self): - self.N = 10000 - self.K = 10 - self.key1 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.key2 = tm.makeStringIndex(self.N).values.repeat(self.K) - self.df = DataFrame({'key1': self.key1, 'key2': self.key2, 'value': np.random.randn((self.N * self.K)), }) - self.col_array_list = list(self.df.values.T) - - self.df2 = self.df.copy() - self.df2.ix[:10000, :] = np.nan - self.col_array_list2 = list(self.df2.values.T) + N = 10000 + K = 10 + key1 = tm.makeStringIndex(N).values.repeat(K) + key2 = tm.makeStringIndex(N).values.repeat(K) + col_array = np.vstack([key1, key2, np.random.randn(N * K)]) + col_array2 = col_array.copy() + col_array2[:, :10000] = np.nan + self.col_array_list = list(col_array) def time_lib_fast_zip(self): lib.fast_zip(self.col_array_list) - def time_lib_fast_zip_fillna(self): - lib.fast_zip_fillna(self.col_array_list2) + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/replace.py b/asv_bench/benchmarks/replace.py index 66b8af53801ac..d8efaf99e2c4d 100644 --- a/asv_bench/benchmarks/replace.py +++ b/asv_bench/benchmarks/replace.py @@ -1,72 +1,56 @@ -from .pandas_vb_common import * -from pandas.compat import range -from datetime import timedelta +import numpy as np +import pandas as pd -class replace_fillna(object): - goal_time = 0.2 +class FillNa(object): - def setup(self): - self.N = 1000000 - try: - self.rng = date_range('1/1/2000', periods=self.N, freq='min') - except NameError: - self.rng = DatetimeIndex('1/1/2000', periods=self.N, offset=datetools.Minute()) - self.date_range = DateRange - self.ts = Series(np.random.randn(self.N), index=self.rng) + params = [True, False] + param_names = ['inplace'] - def time_replace_fillna(self): - self.ts.fillna(0.0, inplace=True) + def setup(self, inplace): + N = 10**6 + rng = pd.date_range('1/1/2000', periods=N, freq='min') + data = np.random.randn(N) + data[::2] = np.nan + self.ts = pd.Series(data, index=rng) + def time_fillna(self, inplace): + self.ts.fillna(0.0, inplace=inplace) -class replace_large_dict(object): - goal_time = 0.2 + def time_replace(self, inplace): + self.ts.replace(np.nan, 0.0, inplace=inplace) - def setup(self): - self.n = (10 ** 6) - self.start_value = (10 ** 5) - self.to_rep = dict(((i, (self.start_value + i)) for i in range(self.n))) - self.s = Series(np.random.randint(self.n, size=(10 ** 3))) - def time_replace_large_dict(self): - self.s.replace(self.to_rep, inplace=True) +class ReplaceDict(object): + params = [True, False] + param_names = ['inplace'] -class replace_convert(object): - goal_time = 0.5 + def setup(self, inplace): + N = 10**5 + start_value = 10**5 + self.to_rep = dict(enumerate(np.arange(N) + 
start_value)) + self.s = pd.Series(np.random.randint(N, size=10**3)) - def setup(self): - self.n = (10 ** 3) - self.to_ts = dict(((i, pd.Timestamp(i)) for i in range(self.n))) - self.to_td = dict(((i, pd.Timedelta(i)) for i in range(self.n))) - self.s = Series(np.random.randint(self.n, size=(10 ** 3))) - self.df = DataFrame({'A': np.random.randint(self.n, size=(10 ** 3)), - 'B': np.random.randint(self.n, size=(10 ** 3))}) + def time_replace_series(self, inplace): + self.s.replace(self.to_rep, inplace=inplace) - def time_replace_series_timestamp(self): - self.s.replace(self.to_ts) - def time_replace_series_timedelta(self): - self.s.replace(self.to_td) +class Convert(object): - def time_replace_frame_timestamp(self): - self.df.replace(self.to_ts) + params = (['DataFrame', 'Series'], ['Timestamp', 'Timedelta']) + param_names = ['constructor', 'replace_data'] - def time_replace_frame_timedelta(self): - self.df.replace(self.to_td) + def setup(self, constructor, replace_data): + N = 10**3 + data = {'Series': pd.Series(np.random.randint(N, size=N)), + 'DataFrame': pd.DataFrame({'A': np.random.randint(N, size=N), + 'B': np.random.randint(N, size=N)})} + self.to_replace = {i: getattr(pd, replace_data) for i in range(N)} + self.data = data[constructor] + def time_replace(self, constructor, replace_data): + self.data.replace(self.to_replace) -class replace_replacena(object): - goal_time = 0.2 - def setup(self): - self.N = 1000000 - try: - self.rng = date_range('1/1/2000', periods=self.N, freq='min') - except NameError: - self.rng = DatetimeIndex('1/1/2000', periods=self.N, offset=datetools.Minute()) - self.date_range = DateRange - self.ts = Series(np.random.randn(self.N), index=self.rng) - - def time_replace_replacena(self): - self.ts.replace(np.nan, 0.0, inplace=True) +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/reshape.py b/asv_bench/benchmarks/reshape.py index b9346c497b9ef..f6ee107ab618e 100644 --- a/asv_bench/benchmarks/reshape.py +++ b/asv_bench/benchmarks/reshape.py @@ -1,13 +1,14 @@ -from .pandas_vb_common import * -from pandas.core.reshape import melt, wide_to_long +import string +from itertools import product +import numpy as np +from pandas import DataFrame, MultiIndex, date_range, melt, wide_to_long +import pandas as pd -class melt_dataframe(object): - goal_time = 0.2 + +class Melt(object): def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) self.df = DataFrame(np.random.randn(10000, 3), columns=['A', 'B', 'C']) self.df['id1'] = np.random.randint(0, 10, 10000) self.df['id2'] = np.random.randint(100, 1000, 10000) @@ -16,104 +17,203 @@ def time_melt_dataframe(self): melt(self.df, id_vars=['id1', 'id2']) -class reshape_pivot_time_series(object): - goal_time = 0.2 +class Pivot(object): def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) - self.index = date_range('1/1/2000', periods=10000, freq='h') - self.df = DataFrame(randn(10000, 50), index=self.index, columns=range(50)) - self.pdf = self.unpivot(self.df) - self.f = (lambda : self.pdf.pivot('date', 'variable', 'value')) + N = 10000 + index = date_range('1/1/2000', periods=N, freq='h') + data = {'value': np.random.randn(N * 50), + 'variable': np.arange(50).repeat(N), + 'date': np.tile(index.values, 50)} + self.df = 
DataFrame(data) def time_reshape_pivot_time_series(self): - self.f() - - def unpivot(self, frame): - (N, K) = frame.shape - self.data = {'value': frame.values.ravel('F'), 'variable': np.asarray(frame.columns).repeat(N), 'date': np.tile(np.asarray(frame.index), K), } - return DataFrame(self.data, columns=['date', 'variable', 'value']) + self.df.pivot('date', 'variable', 'value') -class reshape_stack_simple(object): - goal_time = 0.2 +class SimpleReshape(object): def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) + arrays = [np.arange(100).repeat(100), + np.roll(np.tile(np.arange(100), 100), 25)] + index = MultiIndex.from_arrays(arrays) + self.df = DataFrame(np.random.randn(10000, 4), index=index) self.udf = self.df.unstack(1) - def time_reshape_stack_simple(self): + def time_stack(self): self.udf.stack() - -class reshape_unstack_simple(object): - goal_time = 0.2 - - def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) - - def time_reshape_unstack_simple(self): + def time_unstack(self): self.df.unstack(1) -class reshape_unstack_large_single_dtype(object): - goal_time = 0.2 +class Unstack(object): - def setup(self): + params = ['int', 'category'] + + def setup(self, dtype): m = 100 n = 1000 levels = np.arange(m) - index = pd.MultiIndex.from_product([levels]*2) + index = MultiIndex.from_product([levels] * 2) columns = np.arange(n) - values = np.arange(m*m*n).reshape(m*m, n) - self.df = pd.DataFrame(values, index, columns) + if dtype == 'int': + values = np.arange(m * m * n).reshape(m * m, n) + else: + # the category branch is ~20x slower than int. So we + # cut down the size a bit. Now it's only ~3x slower. 
+ n = 50 + columns = columns[:n] + indices = np.random.randint(0, 52, size=(m * m, n)) + values = np.take(list(string.ascii_letters), indices) + values = [pd.Categorical(v) for v in values.T] + + self.df = DataFrame(values, index, columns) self.df2 = self.df.iloc[:-1] - def time_unstack_full_product(self): + def time_full_product(self, dtype): self.df.unstack() - def time_unstack_with_mask(self): + def time_without_last_row(self, dtype): self.df2.unstack() -class unstack_sparse_keyspace(object): - goal_time = 0.2 +class SparseIndex(object): def setup(self): - self.index = MultiIndex.from_arrays([np.arange(100).repeat(100), np.roll(np.tile(np.arange(100), 100), 25)]) - self.df = DataFrame(np.random.randn(10000, 4), index=self.index) - self.NUM_ROWS = 1000 - for iter in range(10): - self.df = DataFrame({'A': np.random.randint(50, size=self.NUM_ROWS), 'B': np.random.randint(50, size=self.NUM_ROWS), 'C': np.random.randint((-10), 10, size=self.NUM_ROWS), 'D': np.random.randint((-10), 10, size=self.NUM_ROWS), 'E': np.random.randint(10, size=self.NUM_ROWS), 'F': np.random.randn(self.NUM_ROWS), }) - self.idf = self.df.set_index(['A', 'B', 'C', 'D', 'E']) - if (len(self.idf.index.unique()) == self.NUM_ROWS): - break - - def time_unstack_sparse_keyspace(self): - self.idf.unstack() + NUM_ROWS = 1000 + self.df = DataFrame({'A': np.random.randint(50, size=NUM_ROWS), + 'B': np.random.randint(50, size=NUM_ROWS), + 'C': np.random.randint(-10, 10, size=NUM_ROWS), + 'D': np.random.randint(-10, 10, size=NUM_ROWS), + 'E': np.random.randint(10, size=NUM_ROWS), + 'F': np.random.randn(NUM_ROWS)}) + self.df = self.df.set_index(['A', 'B', 'C', 'D', 'E']) + + def time_unstack(self): + self.df.unstack() -class wide_to_long_big(object): - goal_time = 0.2 +class WideToLong(object): def setup(self): - vars = 'ABCD' nyrs = 20 nidvars = 20 N = 5000 - yrvars = [] - for var in vars: - for yr in range(1, nyrs + 1): - yrvars.append(var + str(yr)) - - self.df = pd.DataFrame(np.random.randn(N, nidvars + len(yrvars)), - columns=list(range(nidvars)) + yrvars) - self.vars = vars + self.letters = list('ABCD') + yrvars = [l + str(num) + for l, num in product(self.letters, range(1, nyrs + 1))] + columns = [str(i) for i in range(nidvars)] + yrvars + self.df = DataFrame(np.random.randn(N, nidvars + len(yrvars)), + columns=columns) + self.df['id'] = self.df.index def time_wide_to_long_big(self): - self.df['id'] = self.df.index - wide_to_long(self.df, list(self.vars), i='id', j='year') + wide_to_long(self.df, self.letters, i='id', j='year') + + +class PivotTable(object): + + def setup(self): + N = 100000 + fac1 = np.array(['A', 'B', 'C'], dtype='O') + fac2 = np.array(['one', 'two'], dtype='O') + ind1 = np.random.randint(0, 3, size=N) + ind2 = np.random.randint(0, 2, size=N) + self.df = DataFrame({'key1': fac1.take(ind1), + 'key2': fac2.take(ind2), + 'key3': fac2.take(ind2), + 'value1': np.random.randn(N), + 'value2': np.random.randn(N), + 'value3': np.random.randn(N)}) + + def time_pivot_table(self): + self.df.pivot_table(index='key1', columns=['key2', 'key3']) + + def time_pivot_table_agg(self): + self.df.pivot_table(index='key1', columns=['key2', 'key3'], + aggfunc=['sum', 'mean']) + + def time_pivot_table_margins(self): + self.df.pivot_table(index='key1', columns=['key2', 'key3'], + margins=True) + + +class Crosstab(object): + + def setup(self): + N = 100000 + fac1 = np.array(['A', 'B', 'C'], dtype='O') + fac2 = np.array(['one', 'two'], dtype='O') + self.ind1 = np.random.randint(0, 3, size=N) + self.ind2 = np.random.randint(0, 2, 
size=N) + self.vec1 = fac1.take(self.ind1) + self.vec2 = fac2.take(self.ind2) + + def time_crosstab(self): + pd.crosstab(self.vec1, self.vec2) + + def time_crosstab_values(self): + pd.crosstab(self.vec1, self.vec2, values=self.ind1, aggfunc='sum') + + def time_crosstab_normalize(self): + pd.crosstab(self.vec1, self.vec2, normalize=True) + + def time_crosstab_normalize_margins(self): + pd.crosstab(self.vec1, self.vec2, normalize=True, margins=True) + + +class GetDummies(object): + def setup(self): + categories = list(string.ascii_letters[:12]) + s = pd.Series(np.random.choice(categories, size=1000000), + dtype=pd.api.types.CategoricalDtype(categories)) + self.s = s + + def time_get_dummies_1d(self): + pd.get_dummies(self.s, sparse=False) + + def time_get_dummies_1d_sparse(self): + pd.get_dummies(self.s, sparse=True) + + +class Cut(object): + params = [[4, 10, 1000]] + param_names = ['bins'] + + def setup(self, bins): + N = 10**5 + self.int_series = pd.Series(np.arange(N).repeat(5)) + self.float_series = pd.Series(np.random.randn(N).repeat(5)) + self.timedelta_series = pd.Series(np.random.randint(N, size=N), + dtype='timedelta64[ns]') + self.datetime_series = pd.Series(np.random.randint(N, size=N), + dtype='datetime64[ns]') + + def time_cut_int(self, bins): + pd.cut(self.int_series, bins) + + def time_cut_float(self, bins): + pd.cut(self.float_series, bins) + + def time_cut_timedelta(self, bins): + pd.cut(self.timedelta_series, bins) + + def time_cut_datetime(self, bins): + pd.cut(self.datetime_series, bins) + + def time_qcut_int(self, bins): + pd.qcut(self.int_series, bins) + + def time_qcut_float(self, bins): + pd.qcut(self.float_series, bins) + + def time_qcut_timedelta(self, bins): + pd.qcut(self.timedelta_series, bins) + + def time_qcut_datetime(self, bins): + pd.qcut(self.datetime_series, bins) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/rolling.py b/asv_bench/benchmarks/rolling.py new file mode 100644 index 0000000000000..659b6591fbd4b --- /dev/null +++ b/asv_bench/benchmarks/rolling.py @@ -0,0 +1,116 @@ +import pandas as pd +import numpy as np + + +class Methods(object): + + sample_time = 0.2 + params = (['DataFrame', 'Series'], + [10, 1000], + ['int', 'float'], + ['median', 'mean', 'max', 'min', 'std', 'count', 'skew', 'kurt', + 'sum']) + param_names = ['contructor', 'window', 'dtype', 'method'] + + def setup(self, constructor, window, dtype, method): + N = 10**5 + arr = (100 * np.random.random(N)).astype(dtype) + self.roll = getattr(pd, constructor)(arr).rolling(window) + + def time_rolling(self, constructor, window, dtype, method): + getattr(self.roll, method)() + + +class ExpandingMethods(object): + + sample_time = 0.2 + params = (['DataFrame', 'Series'], + ['int', 'float'], + ['median', 'mean', 'max', 'min', 'std', 'count', 'skew', 'kurt', + 'sum']) + param_names = ['contructor', 'window', 'dtype', 'method'] + + def setup(self, constructor, dtype, method): + N = 10**5 + arr = (100 * np.random.random(N)).astype(dtype) + self.expanding = getattr(pd, constructor)(arr).expanding() + + def time_expanding(self, constructor, dtype, method): + getattr(self.expanding, method)() + + +class EWMMethods(object): + + sample_time = 0.2 + params = (['DataFrame', 'Series'], + [10, 1000], + ['int', 'float'], + ['mean', 'std']) + param_names = ['contructor', 'window', 'dtype', 'method'] + + def setup(self, constructor, window, dtype, method): + N = 10**5 + arr = (100 * np.random.random(N)).astype(dtype) + self.ewm = getattr(pd, 
constructor)(arr).ewm(halflife=window) + + def time_ewm(self, constructor, window, dtype, method): + getattr(self.ewm, method)() + + +class VariableWindowMethods(Methods): + sample_time = 0.2 + params = (['DataFrame', 'Series'], + ['50s', '1h', '1d'], + ['int', 'float'], + ['median', 'mean', 'max', 'min', 'std', 'count', 'skew', 'kurt', + 'sum']) + param_names = ['contructor', 'window', 'dtype', 'method'] + + def setup(self, constructor, window, dtype, method): + N = 10**5 + arr = (100 * np.random.random(N)).astype(dtype) + index = pd.date_range('2017-01-01', periods=N, freq='5s') + self.roll = getattr(pd, constructor)(arr, index=index).rolling(window) + + +class Pairwise(object): + + sample_time = 0.2 + params = ([10, 1000, None], + ['corr', 'cov'], + [True, False]) + param_names = ['window', 'method', 'pairwise'] + + def setup(self, window, method, pairwise): + N = 10**4 + arr = np.random.random(N) + self.df = pd.DataFrame(arr) + + def time_pairwise(self, window, method, pairwise): + if window is None: + r = self.df.expanding() + else: + r = self.df.rolling(window=window) + getattr(r, method)(self.df, pairwise=pairwise) + + +class Quantile(object): + sample_time = 0.2 + params = (['DataFrame', 'Series'], + [10, 1000], + ['int', 'float'], + [0, 0.5, 1], + ['linear', 'nearest', 'lower', 'higher', 'midpoint']) + param_names = ['constructor', 'window', 'dtype', 'percentile'] + + def setup(self, constructor, window, dtype, percentile, interpolation): + N = 10 ** 5 + arr = np.random.random(N).astype(dtype) + self.roll = getattr(pd, constructor)(arr).rolling(window) + + def time_quantile(self, constructor, window, dtype, percentile, + interpolation): + self.roll.quantile(percentile, interpolation=interpolation) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/series_methods.py b/asv_bench/benchmarks/series_methods.py index c66654ee1e006..3303483c50e20 100644 --- a/asv_bench/benchmarks/series_methods.py +++ b/asv_bench/benchmarks/series_methods.py @@ -1,122 +1,204 @@ -from .pandas_vb_common import * +from datetime import datetime +import numpy as np +import pandas.util.testing as tm +from pandas import Series, date_range, NaT -class series_constructor_no_data_datetime_index(object): - goal_time = 0.2 - def setup(self): - self.dr = pd.date_range( - start=datetime(2015,10,26), - end=datetime(2016,1,1), - freq='50s' - ) # ~100k long +class SeriesConstructor(object): - def time_series_constructor_no_data_datetime_index(self): - Series(data=None, index=self.dr) + params = [None, 'dict'] + param_names = ['data'] + def setup(self, data): + self.idx = date_range(start=datetime(2015, 10, 26), + end=datetime(2016, 1, 1), + freq='50s') + dict_data = dict(zip(self.idx, range(len(self.idx)))) + self.data = None if data is None else dict_data -class series_constructor_dict_data_datetime_index(object): - goal_time = 0.2 + def time_constructor(self, data): + Series(data=self.data, index=self.idx) - def setup(self): - self.dr = pd.date_range( - start=datetime(2015, 10, 26), - end=datetime(2016, 1, 1), - freq='50s' - ) # ~100k long - self.data = {d: v for d, v in zip(self.dr, range(len(self.dr)))} - def time_series_constructor_no_data_datetime_index(self): - Series(data=self.data, index=self.dr) +class IsIn(object): + params = ['int64', 'uint64', 'object'] + param_names = ['dtype'] -class series_isin_int64(object): - goal_time = 0.2 + def setup(self, dtype): + self.s = Series(np.random.randint(1, 10, 100000)).astype(dtype) + self.values = [1, 2] + + def time_isin(self, 
dtypes): + self.s.isin(self.values) + + +class IsInFloat64(object): def setup(self): - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.s4 = Series(np.random.randint(1, 100, 10000000)).astype('int64') - self.values = [1, 2] + self.small = Series([1, 2], dtype=np.float64) + self.many_different_values = np.arange(10**6, dtype=np.float64) + self.few_different_values = np.zeros(10**7, dtype=np.float64) + self.only_nans_values = np.full(10**7, np.nan, dtype=np.float64) - def time_series_isin_int64(self): - self.s3.isin(self.values) + def time_isin_many_different(self): + # runtime is dominated by creation of the lookup-table + self.small.isin(self.many_different_values) - def time_series_isin_int64_large(self): - self.s4.isin(self.values) + def time_isin_few_different(self): + # runtime is dominated by creation of the lookup-table + self.small.isin(self.few_different_values) + def time_isin_nan_values(self): + # runtime is dominated by creation of the lookup-table + self.small.isin(self.few_different_values) -class series_isin_object(object): - goal_time = 0.2 + +class IsInForObjects(object): def setup(self): - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') + self.s_nans = Series(np.full(10**4, np.nan)).astype(np.object) + self.vals_nans = np.full(10**4, np.nan).astype(np.object) + self.s_short = Series(np.arange(2)).astype(np.object) + self.s_long = Series(np.arange(10**5)).astype(np.object) + self.vals_short = np.arange(2).astype(np.object) + self.vals_long = np.arange(10**5).astype(np.object) + # because of nans floats are special: + self.s_long_floats = Series(np.arange(10**5, + dtype=np.float)).astype(np.object) + self.vals_long_floats = np.arange(10**5, + dtype=np.float).astype(np.object) - def time_series_isin_object(self): - self.s4.isin(self.values) + def time_isin_nans(self): + # if nan-objects are different objects, + # this has the potential to trigger O(n^2) running time + self.s_nans.isin(self.vals_nans) + def time_isin_short_series_long_values(self): + # running time dominated by the preprocessing + self.s_short.isin(self.vals_long) -class series_nlargest1(object): - goal_time = 0.2 + def time_isin_long_series_short_values(self): + # running time dominated by look-up + self.s_long.isin(self.vals_short) - def setup(self): - self.s1 = Series(np.random.randn(10000)) - self.s2 = Series(np.random.randint(1, 10, 10000)) - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') + def time_isin_long_series_long_values(self): + # no dominating part + self.s_long.isin(self.vals_long) - def time_series_nlargest1(self): - self.s1.nlargest(3, keep='last') - self.s1.nlargest(3, keep='first') + def time_isin_long_series_long_values_floats(self): + # no dominating part + self.s_long_floats.isin(self.vals_long_floats) -class series_nlargest2(object): - goal_time = 0.2 +class NSort(object): - def setup(self): - self.s1 = Series(np.random.randn(10000)) - self.s2 = Series(np.random.randint(1, 10, 10000)) - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') + params = ['first', 'last', 'all'] + param_names = ['keep'] - def time_series_nlargest2(self): - self.s2.nlargest(3, keep='last') - self.s2.nlargest(3, keep='first') + def setup(self, keep): + self.s = Series(np.random.randint(1, 10, 100000)) + def time_nlargest(self, keep): + self.s.nlargest(3, 
keep=keep) -class series_nsmallest2(object): - goal_time = 0.2 + def time_nsmallest(self, keep): + self.s.nsmallest(3, keep=keep) - def setup(self): - self.s1 = Series(np.random.randn(10000)) - self.s2 = Series(np.random.randint(1, 10, 10000)) - self.s3 = Series(np.random.randint(1, 10, 100000)).astype('int64') - self.values = [1, 2] - self.s4 = self.s3.astype('object') - def time_series_nsmallest2(self): - self.s2.nsmallest(3, keep='last') - self.s2.nsmallest(3, keep='first') +class Dropna(object): + + params = ['int', 'datetime'] + param_names = ['dtype'] + + def setup(self, dtype): + N = 10**6 + data = {'int': np.random.randint(1, 10, N), + 'datetime': date_range('2000-01-01', freq='S', periods=N)} + self.s = Series(data[dtype]) + if dtype == 'datetime': + self.s[np.random.randint(1, N, 100)] = NaT + + def time_dropna(self, dtype): + self.s.dropna() + +class SearchSorted(object): -class series_dropna_int64(object): goal_time = 0.2 + params = ['int8', 'int16', 'int32', 'int64', + 'uint8', 'uint16', 'uint32', 'uint64', + 'float16', 'float32', 'float64', + 'str'] + param_names = ['dtype'] + + def setup(self, dtype): + N = 10**5 + data = np.array([1] * N + [2] * N + [3] * N).astype(dtype) + self.s = Series(data) + + def time_searchsorted(self, dtype): + key = '2' if dtype == 'str' else 2 + self.s.searchsorted(key) + + +class Map(object): + + params = ['dict', 'Series'] + param_names = 'mapper' + + def setup(self, mapper): + map_size = 1000 + map_data = Series(map_size - np.arange(map_size)) + self.map_data = map_data if mapper == 'Series' else map_data.to_dict() + self.s = Series(np.random.randint(0, map_size, 10000)) + + def time_map(self, mapper): + self.s.map(self.map_data) + + +class Clip(object): + params = [50, 1000, 10**5] + param_names = ['n'] + + def setup(self, n): + self.s = Series(np.random.randn(n)) + + def time_clip(self, n): + self.s.clip(0, 1) + + +class ValueCounts(object): + + params = ['int', 'uint', 'float', 'object'] + param_names = ['dtype'] + + def setup(self, dtype): + self.s = Series(np.random.randint(0, 1000, size=100000)).astype(dtype) + + def time_value_counts(self, dtype): + self.s.value_counts() + + +class Dir(object): def setup(self): - self.s = Series(np.random.randint(1, 10, 1000000)) + self.s = Series(index=tm.makeStringIndex(10000)) - def time_series_dropna_int64(self): - self.s.dropna() + def time_dir_strings(self): + dir(self.s) -class series_dropna_datetime(object): - goal_time = 0.2 +class SeriesGetattr(object): + # https://github.com/pandas-dev/pandas/issues/19764 def setup(self): - self.s = Series(pd.date_range('2000-01-01', freq='S', periods=1000000)) - self.s[np.random.randint(1, 1000000, 100)] = pd.NaT + self.s = Series(1, + index=date_range("2012-01-01", freq='s', + periods=int(1e6))) - def time_series_dropna_datetime(self): - self.s.dropna() + def time_series_datetimeindex_repr(self): + getattr(self.s, 'a', None) + + +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/sparse.py b/asv_bench/benchmarks/sparse.py index 717fe7218ceda..64f87c1670170 100644 --- a/asv_bench/benchmarks/sparse.py +++ b/asv_bench/benchmarks/sparse.py @@ -1,142 +1,152 @@ -from .pandas_vb_common import * -import pandas.sparse.series +import itertools + +import numpy as np import scipy.sparse -from pandas.core.sparse import SparseSeries, SparseDataFrame -from pandas.core.sparse import SparseDataFrame +from pandas import (SparseSeries, SparseDataFrame, SparseArray, Series, + date_range, MultiIndex) + +def make_array(size, dense_proportion, 
fill_value, dtype): + dense_size = int(size * dense_proportion) + arr = np.full(size, fill_value, dtype) + indexer = np.random.choice(np.arange(size), dense_size, replace=False) + arr[indexer] = np.random.choice(np.arange(100, dtype=dtype), dense_size) + return arr -class sparse_series_to_frame(object): - goal_time = 0.2 + +class SparseSeriesToFrame(object): def setup(self): - self.K = 50 - self.N = 50000 - self.rng = np.asarray(date_range('1/1/2000', periods=self.N, freq='T')) + K = 50 + N = 50001 + rng = date_range('1/1/2000', periods=N, freq='T') self.series = {} - for i in range(1, (self.K + 1)): - self.data = np.random.randn(self.N)[:(- i)] - self.this_rng = self.rng[:(- i)] - self.data[100:] = np.nan - self.series[i] = SparseSeries(self.data, index=self.this_rng) + for i in range(1, K): + data = np.random.randn(N)[:-i] + idx = rng[:-i] + data[100:] = np.nan + self.series[i] = SparseSeries(data, index=idx) - def time_sparse_series_to_frame(self): + def time_series_to_frame(self): SparseDataFrame(self.series) -class sparse_frame_constructor(object): - goal_time = 0.2 +class SparseArrayConstructor(object): - def time_sparse_frame_constructor(self): - SparseDataFrame(columns=np.arange(100), index=np.arange(1000)) + params = ([0.1, 0.01], [0, np.nan], + [np.int64, np.float64, np.object]) + param_names = ['dense_proportion', 'fill_value', 'dtype'] + def setup(self, dense_proportion, fill_value, dtype): + N = 10**6 + self.array = make_array(N, dense_proportion, fill_value, dtype) -class sparse_series_from_coo(object): - goal_time = 0.2 + def time_sparse_array(self, dense_proportion, fill_value, dtype): + SparseArray(self.array, fill_value=fill_value, dtype=dtype) - def setup(self): - self.A = scipy.sparse.coo_matrix(([3.0, 1.0, 2.0], ([1, 0, 0], [0, 2, 3])), shape=(100, 100)) - def time_sparse_series_from_coo(self): - self.ss = pandas.sparse.series.SparseSeries.from_coo(self.A) +class SparseDataFrameConstructor(object): + def setup(self): + N = 1000 + self.arr = np.arange(N) + self.sparse = scipy.sparse.rand(N, N, 0.005) + self.dict = dict(zip(range(N), itertools.repeat([0]))) -class sparse_series_to_coo(object): - goal_time = 0.2 + def time_constructor(self): + SparseDataFrame(columns=self.arr, index=self.arr) - def setup(self): - self.s = pd.Series(([np.nan] * 10000)) - self.s[0] = 3.0 - self.s[100] = (-1.0) - self.s[999] = 12.1 - self.s.index = pd.MultiIndex.from_product((range(10), range(10), range(10), range(10))) - self.ss = self.s.to_sparse() + def time_from_scipy(self): + SparseDataFrame(self.sparse) - def time_sparse_series_to_coo(self): - self.ss.to_coo(row_levels=[0, 1], column_levels=[2, 3], sort_labels=True) + def time_from_dict(self): + SparseDataFrame(self.dict) -class sparse_arithmetic_int(object): - goal_time = 0.2 +class FromCoo(object): def setup(self): - np.random.seed(1) - self.a_10percent = self.make_sparse_array(length=1000000, dense_size=100000, fill_value=np.nan) - self.b_10percent = self.make_sparse_array(length=1000000, dense_size=100000, fill_value=np.nan) + self.matrix = scipy.sparse.coo_matrix(([3.0, 1.0, 2.0], + ([1, 0, 0], [0, 2, 3])), + shape=(100, 100)) + + def time_sparse_series_from_coo(self): + SparseSeries.from_coo(self.matrix) - self.a_10percent_zero = self.make_sparse_array(length=1000000, dense_size=100000, fill_value=0) - self.b_10percent_zero = self.make_sparse_array(length=1000000, dense_size=100000, fill_value=0) - self.a_1percent = self.make_sparse_array(length=1000000, dense_size=10000, fill_value=np.nan) - self.b_1percent = 
self.make_sparse_array(length=1000000, dense_size=10000, fill_value=np.nan) +class ToCoo(object): - def make_sparse_array(self, length, dense_size, fill_value): - arr = np.array([fill_value] * length, dtype=np.float64) - indexer = np.unique(np.random.randint(0, length, dense_size)) - arr[indexer] = np.random.randint(0, 100, len(indexer)) - return pd.SparseArray(arr, fill_value=fill_value) + def setup(self): + s = Series([np.nan] * 10000) + s[0] = 3.0 + s[100] = -1.0 + s[999] = 12.1 + s.index = MultiIndex.from_product([range(10)] * 4) + self.ss = s.to_sparse() - def time_sparse_make_union(self): - self.a_10percent.sp_index.make_union(self.b_10percent.sp_index) + def time_sparse_series_to_coo(self): + self.ss.to_coo(row_levels=[0, 1], + column_levels=[2, 3], + sort_labels=True) - def time_sparse_intersect(self): - self.a_10percent.sp_index.intersect(self.b_10percent.sp_index) - def time_sparse_addition_10percent(self): - self.a_10percent + self.b_10percent +class Arithmetic(object): - def time_sparse_addition_10percent_zero(self): - self.a_10percent_zero + self.b_10percent_zero + params = ([0.1, 0.01], [0, np.nan]) + param_names = ['dense_proportion', 'fill_value'] - def time_sparse_addition_1percent(self): - self.a_1percent + self.b_1percent + def setup(self, dense_proportion, fill_value): + N = 10**6 + arr1 = make_array(N, dense_proportion, fill_value, np.int64) + self.array1 = SparseArray(arr1, fill_value=fill_value) + arr2 = make_array(N, dense_proportion, fill_value, np.int64) + self.array2 = SparseArray(arr2, fill_value=fill_value) - def time_sparse_division_10percent(self): - self.a_10percent / self.b_10percent + def time_make_union(self, dense_proportion, fill_value): + self.array1.sp_index.make_union(self.array2.sp_index) - def time_sparse_division_10percent_zero(self): - self.a_10percent_zero / self.b_10percent_zero + def time_intersect(self, dense_proportion, fill_value): + self.array1.sp_index.intersect(self.array2.sp_index) - def time_sparse_division_1percent(self): - self.a_1percent / self.b_1percent + def time_add(self, dense_proportion, fill_value): + self.array1 + self.array2 + def time_divide(self, dense_proportion, fill_value): + self.array1 / self.array2 -class sparse_arithmetic_block(object): - goal_time = 0.2 +class ArithmeticBlock(object): - def setup(self): - np.random.seed(1) - self.a = self.make_sparse_array(length=1000000, num_blocks=1000, - block_size=10, fill_value=np.nan) - self.b = self.make_sparse_array(length=1000000, num_blocks=1000, - block_size=10, fill_value=np.nan) + params = [np.nan, 0] + param_names = ['fill_value'] - self.a_zero = self.make_sparse_array(length=1000000, num_blocks=1000, - block_size=10, fill_value=0) - self.b_zero = self.make_sparse_array(length=1000000, num_blocks=1000, - block_size=10, fill_value=np.nan) + def setup(self, fill_value): + N = 10**6 + self.arr1 = self.make_block_array(length=N, num_blocks=1000, + block_size=10, fill_value=fill_value) + self.arr2 = self.make_block_array(length=N, num_blocks=1000, + block_size=10, fill_value=fill_value) - def make_sparse_array(self, length, num_blocks, block_size, fill_value): - a = np.array([fill_value] * length) - for block in range(num_blocks): - i = np.random.randint(0, length) - a[i:i + block_size] = np.random.randint(0, 100, len(a[i:i + block_size])) - return pd.SparseArray(a, fill_value=fill_value) + def make_block_array(self, length, num_blocks, block_size, fill_value): + arr = np.full(length, fill_value) + indicies = np.random.choice(np.arange(0, length, block_size), + 
num_blocks, + replace=False) + for ind in indicies: + arr[ind:ind + block_size] = np.random.randint(0, 100, block_size) + return SparseArray(arr, fill_value=fill_value) - def time_sparse_make_union(self): - self.a.sp_index.make_union(self.b.sp_index) + def time_make_union(self, fill_value): + self.arr1.sp_index.make_union(self.arr2.sp_index) - def time_sparse_intersect(self): - self.a.sp_index.intersect(self.b.sp_index) + def time_intersect(self, fill_value): + self.arr2.sp_index.intersect(self.arr2.sp_index) - def time_sparse_addition(self): - self.a + self.b + def time_addition(self, fill_value): + self.arr1 + self.arr2 - def time_sparse_addition_zero(self): - self.a_zero + self.b_zero + def time_division(self, fill_value): + self.arr1 / self.arr2 - def time_sparse_division(self): - self.a / self.b - def time_sparse_division_zero(self): - self.a_zero / self.b_zero +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/stat_ops.py b/asv_bench/benchmarks/stat_ops.py index 12fbb2478c2a5..7fdc713f076ed 100644 --- a/asv_bench/benchmarks/stat_ops.py +++ b/asv_bench/benchmarks/stat_ops.py @@ -1,261 +1,144 @@ -from .pandas_vb_common import * +import numpy as np +import pandas as pd -class stat_ops_frame_mean_float_axis_0(object): - goal_time = 0.2 +ops = ['mean', 'sum', 'median', 'std', 'skew', 'kurt', 'mad', 'prod', 'sem', + 'var'] - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) - def time_stat_ops_frame_mean_float_axis_0(self): - self.df.mean() +class FrameOps(object): + params = [ops, ['float', 'int'], [0, 1], [True, False]] + param_names = ['op', 'dtype', 'axis', 'use_bottleneck'] -class stat_ops_frame_mean_float_axis_1(object): - goal_time = 0.2 + def setup(self, op, dtype, axis, use_bottleneck): + df = pd.DataFrame(np.random.randn(100000, 4)).astype(dtype) + try: + pd.options.compute.use_bottleneck = use_bottleneck + except TypeError: + from pandas.core import nanops + nanops._USE_BOTTLENECK = use_bottleneck + self.df_func = getattr(df, op) - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + def time_op(self, op, dtype, axis, use_bottleneck): + self.df_func(axis=axis) - def time_stat_ops_frame_mean_float_axis_1(self): - self.df.mean(1) +class FrameMultiIndexOps(object): -class stat_ops_frame_mean_int_axis_0(object): - goal_time = 0.2 + params = ([0, 1, [0, 1]], ops) + param_names = ['level', 'op'] - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + def setup(self, level, op): + levels = [np.arange(10), np.arange(100), np.arange(100)] + codes = [np.arange(10).repeat(10000), + np.tile(np.arange(100).repeat(100), 10), + np.tile(np.tile(np.arange(100), 100), 10)] + index = pd.MultiIndex(levels=levels, codes=codes) + df = pd.DataFrame(np.random.randn(len(index), 4), index=index) + self.df_func = getattr(df, op) - def time_stat_ops_frame_mean_int_axis_0(self): - self.dfi.mean() + def time_op(self, level, op): + self.df_func(level=level) -class stat_ops_frame_mean_int_axis_1(object): - goal_time = 0.2 +class SeriesOps(object): - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + params = [ops, ['float', 'int'], [True, False]] + param_names = ['op', 'dtype', 'use_bottleneck'] - def time_stat_ops_frame_mean_int_axis_1(self): - 
self.dfi.mean(1) + def setup(self, op, dtype, use_bottleneck): + s = pd.Series(np.random.randn(100000)).astype(dtype) + try: + pd.options.compute.use_bottleneck = use_bottleneck + except TypeError: + from pandas.core import nanops + nanops._USE_BOTTLENECK = use_bottleneck + self.s_func = getattr(s, op) + def time_op(self, op, dtype, use_bottleneck): + self.s_func() -class stat_ops_frame_sum_float_axis_0(object): - goal_time = 0.2 - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) +class SeriesMultiIndexOps(object): - def time_stat_ops_frame_sum_float_axis_0(self): - self.df.sum() + params = ([0, 1, [0, 1]], ops) + param_names = ['level', 'op'] + def setup(self, level, op): + levels = [np.arange(10), np.arange(100), np.arange(100)] + codes = [np.arange(10).repeat(10000), + np.tile(np.arange(100).repeat(100), 10), + np.tile(np.tile(np.arange(100), 100), 10)] + index = pd.MultiIndex(levels=levels, codes=codes) + s = pd.Series(np.random.randn(len(index)), index=index) + self.s_func = getattr(s, op) -class stat_ops_frame_sum_float_axis_1(object): - goal_time = 0.2 + def time_op(self, level, op): + self.s_func(level=level) - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) - def time_stat_ops_frame_sum_float_axis_1(self): - self.df.sum(1) +class Rank(object): + params = [['DataFrame', 'Series'], [True, False]] + param_names = ['constructor', 'pct'] -class stat_ops_frame_sum_int_axis_0(object): - goal_time = 0.2 + def setup(self, constructor, pct): + values = np.random.randn(10**5) + self.data = getattr(pd, constructor)(values) - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + def time_rank(self, constructor, pct): + self.data.rank(pct=pct) - def time_stat_ops_frame_sum_int_axis_0(self): - self.dfi.sum() + def time_average_old(self, constructor, pct): + self.data.rank(pct=pct) / len(self.data) -class stat_ops_frame_sum_int_axis_1(object): - goal_time = 0.2 +class Correlation(object): - def setup(self): - self.df = DataFrame(np.random.randn(100000, 4)) - self.dfi = DataFrame(np.random.randint(1000, size=self.df.shape)) + params = [['spearman', 'kendall', 'pearson'], [True, False]] + param_names = ['method', 'use_bottleneck'] - def time_stat_ops_frame_sum_int_axis_1(self): - self.dfi.sum(1) + def setup(self, method, use_bottleneck): + try: + pd.options.compute.use_bottleneck = use_bottleneck + except TypeError: + from pandas.core import nanops + nanops._USE_BOTTLENECK = use_bottleneck + self.df = pd.DataFrame(np.random.randn(1000, 30)) + self.df2 = pd.DataFrame(np.random.randn(1000, 30)) + self.s = pd.Series(np.random.randn(1000)) + self.s2 = pd.Series(np.random.randn(1000)) + def time_corr(self, method, use_bottleneck): + self.df.corr(method=method) -class stat_ops_level_frame_sum(object): - goal_time = 0.2 + def time_corr_series(self, method, use_bottleneck): + self.s.corr(self.s2, method=method) - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) + def time_corrwith_cols(self, 
method, use_bottleneck): + self.df.corrwith(self.df2, method=method) - def time_stat_ops_level_frame_sum(self): - self.df.sum(level=1) + def time_corrwith_rows(self, method, use_bottleneck): + self.df.corrwith(self.df2, axis=1, method=method) -class stat_ops_level_frame_sum_multiple(object): - goal_time = 0.2 +class Covariance(object): - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) + params = [[True, False]] + param_names = ['use_bottleneck'] - def time_stat_ops_level_frame_sum_multiple(self): - self.df.sum(level=[0, 1]) + def setup(self, use_bottleneck): + try: + pd.options.compute.use_bottleneck = use_bottleneck + except TypeError: + from pandas.core import nanops + nanops._USE_BOTTLENECK = use_bottleneck + self.s = pd.Series(np.random.randn(100000)) + self.s2 = pd.Series(np.random.randn(100000)) + def time_cov_series(self, use_bottleneck): + self.s.cov(self.s2) -class stat_ops_level_series_sum(object): - goal_time = 0.2 - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) - - def time_stat_ops_level_series_sum(self): - self.df[1].sum(level=1) - - -class stat_ops_level_series_sum_multiple(object): - goal_time = 0.2 - - def setup(self): - self.index = MultiIndex(levels=[np.arange(10), np.arange(100), np.arange(100)], labels=[np.arange(10).repeat(10000), np.tile(np.arange(100).repeat(100), 10), np.tile(np.tile(np.arange(100), 100), 10)]) - random.shuffle(self.index.values) - self.df = DataFrame(np.random.randn(len(self.index), 4), index=self.index) - self.df_level = DataFrame(np.random.randn(100, 4), index=self.index.levels[1]) - - def time_stat_ops_level_series_sum_multiple(self): - self.df[1].sum(level=[0, 1]) - - -class stat_ops_series_std(object): - goal_time = 0.2 - - def setup(self): - self.s = Series(np.random.randn(100000), index=np.arange(100000)) - self.s[::2] = np.nan - - def time_stat_ops_series_std(self): - self.s.std() - - -class stats_corr_spearman(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(1000, 30)) - - def time_stats_corr_spearman(self): - self.df.corr(method='spearman') - - -class stats_rank2d_axis0_average(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(5000, 50)) - - def time_stats_rank2d_axis0_average(self): - self.df.rank() - - -class stats_rank2d_axis1_average(object): - goal_time = 0.2 - - def setup(self): - self.df = DataFrame(np.random.randn(5000, 50)) - - def time_stats_rank2d_axis1_average(self): - self.df.rank(1) - - -class stats_rank_average(object): - goal_time = 0.2 - - def setup(self): - self.values = np.concatenate([np.arange(100000), np.random.randn(100000), np.arange(100000)]) - self.s = Series(self.values) - - def time_stats_rank_average(self): - self.s.rank() - - -class stats_rank_average_int(object): - goal_time = 0.2 - - def setup(self): - 
self.values = np.random.randint(0, 100000, size=200000) - self.s = Series(self.values) - - def time_stats_rank_average_int(self): - self.s.rank() - - -class stats_rank_pct_average(object): - goal_time = 0.2 - - def setup(self): - self.values = np.concatenate([np.arange(100000), np.random.randn(100000), np.arange(100000)]) - self.s = Series(self.values) - - def time_stats_rank_pct_average(self): - self.s.rank(pct=True) - - -class stats_rank_pct_average_old(object): - goal_time = 0.2 - - def setup(self): - self.values = np.concatenate([np.arange(100000), np.random.randn(100000), np.arange(100000)]) - self.s = Series(self.values) - - def time_stats_rank_pct_average_old(self): - (self.s.rank() / len(self.s)) - - -class stats_rolling_mean(object): - goal_time = 0.2 - - def setup(self): - self.arr = np.random.randn(100000) - self.win = 100 - - def time_rolling_mean(self): - rolling_mean(self.arr, self.win) - - def time_rolling_median(self): - rolling_median(self.arr, self.win) - - def time_rolling_min(self): - rolling_min(self.arr, self.win) - - def time_rolling_max(self): - rolling_max(self.arr, self.win) - - def time_rolling_sum(self): - rolling_sum(self.arr, self.win) - - def time_rolling_std(self): - rolling_std(self.arr, self.win) - - def time_rolling_var(self): - rolling_var(self.arr, self.win) - - def time_rolling_skew(self): - rolling_skew(self.arr, self.win) - - def time_rolling_kurt(self): - rolling_kurt(self.arr, self.win) +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/strings.py b/asv_bench/benchmarks/strings.py index c1600d4e07f58..b5b2c955f0133 100644 --- a/asv_bench/benchmarks/strings.py +++ b/asv_bench/benchmarks/strings.py @@ -1,107 +1,188 @@ -from .pandas_vb_common import * -import string -import itertools as IT -import pandas.util.testing as testing +import warnings +import numpy as np +from pandas import Series, DataFrame +import pandas.util.testing as tm -class StringMethods(object): - goal_time = 0.2 - def make_series(self, letters, strlen, size): - return Series([str(x) for x in np.fromiter(IT.cycle(letters), count=(size * strlen), dtype='|S1').view('|S{}'.format(strlen))]) +class Methods(object): def setup(self): - self.many = self.make_series(('matchthis' + string.ascii_uppercase), strlen=19, size=10000) - self.few = self.make_series(('matchthis' + (string.ascii_uppercase * 42)), strlen=19, size=10000) - self.s = self.make_series(string.ascii_uppercase, strlen=10, size=10000).str.join('|') - - def time_cat(self): - self.many.str.cat(sep=',') + self.s = Series(tm.makeStringIndex(10**5)) def time_center(self): - self.many.str.center(100) - - def time_contains_few(self): - self.few.str.contains('matchthis') - - def time_contains_few_noregex(self): - self.few.str.contains('matchthis', regex=False) - - def time_contains_many(self): - self.many.str.contains('matchthis') - - def time_contains_many_noregex(self): - self.many.str.contains('matchthis', regex=False) + self.s.str.center(100) def time_count(self): - self.many.str.count('matchthis') + self.s.str.count('A') def time_endswith(self): - self.many.str.endswith('matchthis') + self.s.str.endswith('A') def time_extract(self): - self.many.str.extract('(\\w*)matchthis(\\w*)') + with warnings.catch_warnings(record=True): + self.s.str.extract('(\\w*)A(\\w*)') def time_findall(self): - self.many.str.findall('[A-Z]+') + self.s.str.findall('[A-Z]+') - def time_get(self): - self.many.str.get(0) + def time_find(self): + self.s.str.find('[A-Z]+') - def time_join_split(self): - 
self.many.str.join('--').str.split('--') + def time_rfind(self): + self.s.str.rfind('[A-Z]+') - def time_join_split_expand(self): - self.many.str.join('--').str.split('--', expand=True) + def time_get(self): + self.s.str.get(0) def time_len(self): - self.many.str.len() + self.s.str.len() + + def time_join(self): + self.s.str.join(' ') def time_match(self): - self.many.str.match('mat..this') + self.s.str.match('A') + + def time_normalize(self): + self.s.str.normalize('NFC') def time_pad(self): - self.many.str.pad(100, side='both') + self.s.str.pad(100, side='both') - def time_repeat(self): - self.many.str.repeat(list(IT.islice(IT.cycle(range(1, 4)), len(self.many)))) + def time_partition(self): + self.s.str.partition('A') + + def time_rpartition(self): + self.s.str.rpartition('A') def time_replace(self): - self.many.str.replace('(matchthis)', '\x01\x01') + self.s.str.replace('A', '\x01\x01') + + def time_translate(self): + self.s.str.translate({'A': '\x01\x01'}) def time_slice(self): - self.many.str.slice(5, 15, 2) + self.s.str.slice(5, 15, 2) def time_startswith(self): - self.many.str.startswith('matchthis') + self.s.str.startswith('A') def time_strip(self): - self.many.str.strip('matchthis') + self.s.str.strip('A') def time_rstrip(self): - self.many.str.rstrip('matchthis') + self.s.str.rstrip('A') def time_lstrip(self): - self.many.str.lstrip('matchthis') + self.s.str.lstrip('A') def time_title(self): - self.many.str.title() + self.s.str.title() def time_upper(self): - self.many.str.upper() + self.s.str.upper() def time_lower(self): - self.many.str.lower() + self.s.str.lower() + + def time_wrap(self): + self.s.str.wrap(10) + + def time_zfill(self): + self.s.str.zfill(10) + + +class Repeat(object): + + params = ['int', 'array'] + param_names = ['repeats'] + + def setup(self, repeats): + N = 10**5 + self.s = Series(tm.makeStringIndex(N)) + repeat = {'int': 1, 'array': np.random.randint(1, 3, N)} + self.values = repeat[repeats] + + def time_repeat(self, repeats): + self.s.str.repeat(self.values) + + +class Cat(object): + + params = ([0, 3], [None, ','], [None, '-'], [0.0, 0.001, 0.15]) + param_names = ['other_cols', 'sep', 'na_rep', 'na_frac'] + + def setup(self, other_cols, sep, na_rep, na_frac): + N = 10 ** 5 + mask_gen = lambda: np.random.choice([True, False], N, + p=[1 - na_frac, na_frac]) + self.s = Series(tm.makeStringIndex(N)).where(mask_gen()) + if other_cols == 0: + # str.cat self-concatenates only for others=None + self.others = None + else: + self.others = DataFrame({i: tm.makeStringIndex(N).where(mask_gen()) + for i in range(other_cols)}) + + def time_cat(self, other_cols, sep, na_rep, na_frac): + # before the concatenation (one caller + other_cols columns), the total + # expected fraction of rows containing any NaN is: + # reduce(lambda t, _: t + (1 - t) * na_frac, range(other_cols + 1), 0) + # for other_cols=3 and na_frac=0.15, this works out to ~48% + self.s.str.cat(others=self.others, sep=sep, na_rep=na_rep) + + +class Contains(object): + + params = [True, False] + param_names = ['regex'] + + def setup(self, regex): + self.s = Series(tm.makeStringIndex(10**5)) + + def time_contains(self, regex): + self.s.str.contains('A', regex=regex) + + +class Split(object): + + params = [True, False] + param_names = ['expand'] + + def setup(self, expand): + self.s = Series(tm.makeStringIndex(10**5)).str.join('--') + + def time_split(self, expand): + self.s.str.split('--', expand=expand) + + def time_rsplit(self, expand): + self.s.str.rsplit('--', expand=expand) + + +class Dummies(object): 
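For reference, the ~48% figure quoted in the Cat.time_cat comment above can be checked directly; this standalone snippet (not part of the benchmark suite) evaluates the quoted reduce expression and the equivalent closed form 1 - (1 - na_frac) ** (other_cols + 1):

from functools import reduce

other_cols, na_frac = 3, 0.15
by_reduce = reduce(lambda t, _: t + (1 - t) * na_frac,
                   range(other_cols + 1), 0)
closed_form = 1 - (1 - na_frac) ** (other_cols + 1)
assert abs(by_reduce - closed_form) < 1e-12  # both ~0.478, i.e. roughly 48%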
+ + def setup(self): + self.s = Series(tm.makeStringIndex(10**5)).str.join('|') def time_get_dummies(self): self.s.str.get_dummies('|') -class StringEncode(object): - goal_time = 0.2 +class Encode(object): def setup(self): - self.ser = Series(testing.makeUnicodeIndex()) + self.ser = Series(tm.makeUnicodeIndex()) def time_encode_decode(self): self.ser.str.encode('utf-8').str.decode('utf-8') + + +class Slice(object): + + def setup(self): + self.s = Series(['abcdefg', np.nan] * 500000) + + def time_vector_slice(self): + # GH 2602 + self.s.str[:5] diff --git a/asv_bench/benchmarks/timedelta.py b/asv_bench/benchmarks/timedelta.py index c112d1ef72eb8..0cfbbd536bc8b 100644 --- a/asv_bench/benchmarks/timedelta.py +++ b/asv_bench/benchmarks/timedelta.py @@ -1,42 +1,153 @@ -from .pandas_vb_common import * -from pandas import to_timedelta, Timestamp +import datetime +import numpy as np -class ToTimedelta(object): - goal_time = 0.2 +from pandas import ( + DataFrame, Series, Timedelta, Timestamp, timedelta_range, to_timedelta) - def setup(self): - self.arr = np.random.randint(0, 1000, size=10000) - self.arr2 = ['{0} days'.format(i) for i in self.arr] - self.arr3 = np.random.randint(0, 60, size=10000) - self.arr3 = ['00:00:{0:02d}'.format(i) for i in self.arr3] +class TimedeltaConstructor(object): + + def time_from_int(self): + Timedelta(123456789) + + def time_from_unit(self): + Timedelta(1, unit='d') + + def time_from_components(self): + Timedelta(days=1, hours=2, minutes=3, seconds=4, milliseconds=5, + microseconds=6, nanoseconds=7) + + def time_from_datetime_timedelta(self): + Timedelta(datetime.timedelta(days=1, seconds=1)) + + def time_from_np_timedelta(self): + Timedelta(np.timedelta64(1, 'ms')) + + def time_from_string(self): + Timedelta('1 days') + + def time_from_iso_format(self): + Timedelta('P4DT12H30M5S') + + def time_from_missing(self): + Timedelta('nat') + - self.arr4 = list(self.arr2) - self.arr4[-1] = 'apple' +class ToTimedelta(object): + + def setup(self): + self.ints = np.random.randint(0, 60, size=10000) + self.str_days = [] + self.str_seconds = [] + for i in self.ints: + self.str_days.append('{0} days'.format(i)) + self.str_seconds.append('00:00:{0:02d}'.format(i)) def time_convert_int(self): - to_timedelta(self.arr, unit='s') + to_timedelta(self.ints, unit='s') - def time_convert_string(self): - to_timedelta(self.arr2) + def time_convert_string_days(self): + to_timedelta(self.str_days) def time_convert_string_seconds(self): - to_timedelta(self.arr3) + to_timedelta(self.str_seconds) + + +class ToTimedeltaErrors(object): + + params = ['coerce', 'ignore'] + param_names = ['errors'] - def time_convert_coerce(self): - to_timedelta(self.arr4, errors='coerce') + def setup(self, errors): + ints = np.random.randint(0, 60, size=10000) + self.arr = ['{0} days'.format(i) for i in ints] + self.arr[-1] = 'apple' - def time_convert_ignore(self): - to_timedelta(self.arr4, errors='ignore') + def time_convert(self, errors): + to_timedelta(self.arr, errors=errors) -class Ops(object): - goal_time = 0.2 +class TimedeltaOps(object): def setup(self): self.td = to_timedelta(np.arange(1000000)) self.ts = Timestamp('2000') - def test_add_td_ts(self): + def time_add_td_ts(self): self.td + self.ts + + +class TimedeltaProperties(object): + + def setup_cache(self): + td = Timedelta(days=365, minutes=35, seconds=25, milliseconds=35) + return td + + def time_timedelta_days(self, td): + td.days + + def time_timedelta_seconds(self, td): + td.seconds + + def time_timedelta_microseconds(self, td): + td.microseconds + 
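TimedeltaProperties above uses asv's setup_cache hook: the returned object is built once, cached by asv, and then passed as the first argument to every timing method (here td) instead of being stored on self. A minimal standalone sketch of the same pattern, using a hypothetical class name:

import numpy as np
import pandas as pd


class ExampleCachedBenchmark(object):
    # setup_cache runs once; asv persists its return value and hands it to
    # each time_* method as the first positional argument.
    def setup_cache(self):
        return pd.Series(np.arange(10**5))

    def time_sum(self, s):
        s.sum()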
+ def time_timedelta_nanoseconds(self, td): + td.nanoseconds + + +class DatetimeAccessor(object): + + def setup_cache(self): + N = 100000 + series = Series(timedelta_range('1 days', periods=N, freq='h')) + return series + + def time_dt_accessor(self, series): + series.dt + + def time_timedelta_days(self, series): + series.dt.days + + def time_timedelta_seconds(self, series): + series.dt.seconds + + def time_timedelta_microseconds(self, series): + series.dt.microseconds + + def time_timedelta_nanoseconds(self, series): + series.dt.nanoseconds + + +class TimedeltaIndexing(object): + + def setup(self): + self.index = timedelta_range(start='1985', periods=1000, freq='D') + self.index2 = timedelta_range(start='1986', periods=1000, freq='D') + self.series = Series(range(1000), index=self.index) + self.timedelta = self.index[500] + + def time_get_loc(self): + self.index.get_loc(self.timedelta) + + def time_shape(self): + self.index.shape + + def time_shallow_copy(self): + self.index._shallow_copy() + + def time_series_loc(self): + self.series.loc[self.timedelta] + + def time_align(self): + DataFrame({'a': self.series, 'b': self.series[:500]}) + + def time_intersection(self): + self.index.intersection(self.index2) + + def time_union(self): + self.index.union(self.index2) + + def time_unique(self): + self.index.unique() diff --git a/asv_bench/benchmarks/timeseries.py b/asv_bench/benchmarks/timeseries.py index 6e9ef4b10273c..6efd720d1acdd 100644 --- a/asv_bench/benchmarks/timeseries.py +++ b/asv_bench/benchmarks/timeseries.py @@ -1,349 +1,313 @@ -from pandas.tseries.converter import DatetimeConverter -from .pandas_vb_common import * -import pandas as pd from datetime import timedelta -import datetime as dt + +import dateutil +import numpy as np +from pandas import to_datetime, date_range, Series, DataFrame, period_range +from pandas.tseries.frequencies import infer_freq try: - import pandas.tseries.holiday + from pandas.plotting._converter import DatetimeConverter except ImportError: - pass -from pandas.tseries.frequencies import infer_freq -import numpy as np - -if hasattr(Series, 'convert'): - Series.resample = Series.convert + from pandas.tseries.converter import DatetimeConverter class DatetimeIndex(object): - goal_time = 0.2 - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() + params = ['dst', 'repeated', 'tz_aware', 'tz_local', 'tz_naive'] + param_names = ['index_type'] - self.rng2 = date_range(start='1/1/2000 9:30', periods=10000, freq='S', tz='US/Eastern') + def setup(self, index_type): + N = 100000 + dtidxes = {'dst': date_range(start='10/29/2000 1:00:00', + end='10/29/2000 1:59:59', freq='S'), + 'repeated': date_range(start='2000', + periods=N / 10, + freq='s').repeat(10), + 'tz_aware': date_range(start='2000', + periods=N, + freq='s', + tz='US/Eastern'), + 'tz_local': date_range(start='2000', + periods=N, + freq='s', + tz=dateutil.tz.tzlocal()), + 'tz_naive': date_range(start='2000', + periods=N, + freq='s')} + self.index = dtidxes[index_type] - self.index_repeated = date_range(start='1/1/2000', periods=1000, freq='T').repeat(10) + def time_add_timedelta(self, index_type): + self.index + timedelta(minutes=2) - self.rng3 = date_range(start='1/1/2000', periods=1000, freq='H') - self.df = DataFrame(np.random.randn(len(self.rng3), 2), self.rng3) + def time_normalize(self, index_type): + 
self.index.normalize() - self.rng4 = date_range(start='1/1/2000', periods=1000, freq='H', tz='US/Eastern') - self.df2 = DataFrame(np.random.randn(len(self.rng4), 2), index=self.rng4) + def time_unique(self, index_type): + self.index.unique() - N = 100000 - self.dti = pd.date_range('2011-01-01', freq='H', periods=N).repeat(5) - self.dti_tz = pd.date_range('2011-01-01', freq='H', periods=N, - tz='Asia/Tokyo').repeat(5) + def time_to_time(self, index_type): + self.index.time + + def time_get(self, index_type): + self.index[0] - self.rng5 = date_range(start='1/1/2000', end='3/1/2000', tz='US/Eastern') + def time_timeseries_is_month_start(self, index_type): + self.index.is_month_start - self.dst_rng = date_range(start='10/29/2000 1:00:00', end='10/29/2000 1:59:59', freq='S') - self.index = date_range(start='10/29/2000', end='10/29/2000 00:59:59', freq='S') - self.index = self.index.append(self.dst_rng) - self.index = self.index.append(self.dst_rng) - self.index = self.index.append(date_range(start='10/29/2000 2:00:00', end='10/29/2000 3:00:00', freq='S')) + def time_to_date(self, index_type): + self.index.date - self.N = 10000 - self.rng6 = date_range(start='1/1/1', periods=self.N, freq='B') + def time_to_pydatetime(self, index_type): + self.index.to_pydatetime() - self.rng7 = date_range(start='1/1/1700', freq='D', periods=100000) - self.a = self.rng7[:50000].append(self.rng7[50002:]) - def time_add_timedelta(self): - (self.rng + timedelta(minutes=2)) +class TzLocalize(object): - def time_add_offset_delta(self): - (self.rng + self.delta_offset) + params = [None, 'US/Eastern', 'UTC', dateutil.tz.tzutc()] + param_names = 'tz' - def time_add_offset_fast(self): - (self.rng + self.fast_offset) + def setup(self, tz): + dst_rng = date_range(start='10/29/2000 1:00:00', + end='10/29/2000 1:59:59', freq='S') + self.index = date_range(start='10/29/2000', + end='10/29/2000 00:59:59', freq='S') + self.index = self.index.append(dst_rng) + self.index = self.index.append(dst_rng) + self.index = self.index.append(date_range(start='10/29/2000 2:00:00', + end='10/29/2000 3:00:00', + freq='S')) - def time_add_offset_slow(self): - (self.rng + self.slow_offset) + def time_infer_dst(self, tz): + self.index.tz_localize(tz, ambiguous='infer') - def time_normalize(self): - self.rng2.normalize() - def time_unique(self): - self.index_repeated.unique() +class ResetIndex(object): - def time_reset_index(self): + params = [None, 'US/Eastern'] + param_names = 'tz' + + def setup(self, tz): + idx = date_range(start='1/1/2000', periods=1000, freq='H', tz=tz) + self.df = DataFrame(np.random.randn(1000, 2), index=idx) + + def time_reest_datetimeindex(self, tz): self.df.reset_index() - def time_reset_index_tz(self): - self.df2.reset_index() - def time_dti_factorize(self): +class Factorize(object): + + params = [None, 'Asia/Tokyo'] + param_names = 'tz' + + def setup(self, tz): + N = 100000 + self.dti = date_range('2011-01-01', freq='H', periods=N, tz=tz) + self.dti = self.dti.repeat(5) + + def time_factorize(self, tz): self.dti.factorize() - def time_dti_tz_factorize(self): - self.dti_tz.factorize() - def time_timestamp_tzinfo_cons(self): - self.rng5[0] +class InferFreq(object): - def time_infer_dst(self): - self.index.tz_localize('US/Eastern', infer_dst=True) + params = [None, 'D', 'B'] + param_names = ['freq'] - def time_timeseries_is_month_start(self): - self.rng6.is_month_start + def setup(self, freq): + if freq is None: + self.idx = date_range(start='1/1/1700', freq='D', periods=10000) + self.idx.freq = None + else: + self.idx = 
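The TzLocalize benchmark above exercises tz_localize with ambiguous='infer' on an index in which the 01:00-01:59 wall-clock hour of the US/Eastern fall-back is duplicated; 'infer' uses the ordering of the repeated times to decide which occurrence belongs to DST. The same index can be built and localized outside the benchmark like this:

import pandas as pd

dst_rng = pd.date_range(start='10/29/2000 1:00:00',
                        end='10/29/2000 1:59:59', freq='S')
idx = pd.date_range(start='10/29/2000', end='10/29/2000 00:59:59', freq='S')
idx = idx.append(dst_rng).append(dst_rng)
idx = idx.append(pd.date_range(start='10/29/2000 2:00:00',
                               end='10/29/2000 3:00:00', freq='S'))
idx.tz_localize('US/Eastern', ambiguous='infer')  # disambiguates the repeated hour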
date_range(start='1/1/1700', freq=freq, periods=10000) - def time_infer_freq(self): - infer_freq(self.a) + def time_infer_freq(self, freq): + infer_freq(self.idx) class TimeDatetimeConverter(object): - goal_time = 0.2 def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') + N = 100000 + self.rng = date_range(start='1/1/2000', periods=N, freq='T') def time_convert(self): DatetimeConverter.convert(self.rng, None, None) class Iteration(object): - goal_time = 0.2 - - def setup(self): - self.N = 1000000 - self.M = 10000 - self.idx1 = date_range(start='20140101', freq='T', periods=self.N) - self.idx2 = period_range(start='20140101', freq='T', periods=self.N) - - def iter_n(self, iterable, n=None): - self.i = 0 - for _ in iterable: - self.i += 1 - if ((n is not None) and (self.i > n)): - break - def time_iter_datetimeindex(self): - self.iter_n(self.idx1) + params = [date_range, period_range] + param_names = ['time_index'] - def time_iter_datetimeindex_preexit(self): - self.iter_n(self.idx1, self.M) + def setup(self, time_index): + N = 10**6 + self.idx = time_index(start='20140101', freq='T', periods=N) + self.exit = 10000 - def time_iter_periodindex(self): - self.iter_n(self.idx2) - - def time_iter_periodindex_preexit(self): - self.iter_n(self.idx2, self.M) + def time_iter(self, time_index): + for _ in self.idx: + pass + def time_iter_preexit(self, time_index): + for i, _ in enumerate(self.idx): + if i > self.exit: + break -#---------------------------------------------------------------------- -# Resampling class ResampleDataFrame(object): - goal_time = 0.2 - - def setup(self): - self.rng = date_range(start='20130101', periods=100000, freq='50L') - self.df = DataFrame(np.random.randn(100000, 2), index=self.rng) - - def time_max_numpy(self): - self.df.resample('1s', how=np.max) - def time_max_string(self): - self.df.resample('1s', how='max') + params = ['max', 'mean', 'min'] + param_names = ['method'] - def time_mean_numpy(self): - self.df.resample('1s', how=np.mean) + def setup(self, method): + rng = date_range(start='20130101', periods=100000, freq='50L') + df = DataFrame(np.random.randn(100000, 2), index=rng) + self.resample = getattr(df.resample('1s'), method) - def time_mean_string(self): - self.df.resample('1s', how='mean') - - def time_min_numpy(self): - self.df.resample('1s', how=np.min) - - def time_min_string(self): - self.df.resample('1s', how='min') + def time_method(self, method): + self.resample() class ResampleSeries(object): - goal_time = 0.2 - - def setup(self): - self.rng1 = period_range(start='1/1/2000', end='1/1/2001', freq='T') - self.ts1 = Series(np.random.randn(len(self.rng1)), index=self.rng1) - - self.rng2 = date_range(start='1/1/2000', end='1/1/2001', freq='T') - self.ts2 = Series(np.random.randn(len(self.rng2)), index=self.rng2) - self.rng3 = date_range(start='2000-01-01 00:00:00', end='2000-01-01 10:00:00', freq='555000U') - self.int_ts = Series(5, self.rng3, dtype='int64') - self.dt_ts = self.int_ts.astype('datetime64[ns]') + params = (['period', 'datetime'], ['5min', '1D'], ['mean', 'ohlc']) + param_names = ['index', 'freq', 'method'] - def time_period_downsample_mean(self): - self.ts1.resample('D', how='mean') + def setup(self, index, freq, method): + indexes = {'period': period_range(start='1/1/2000', + end='1/1/2001', + freq='T'), + 'datetime': date_range(start='1/1/2000', + end='1/1/2001', + freq='T')} + idx = indexes[index] + ts = Series(np.random.randn(len(idx)), index=idx) + self.resample = 
getattr(ts.resample(freq), method) - def time_timestamp_downsample_mean(self): - self.ts2.resample('D', how='mean') + def time_resample(self, index, freq, method): + self.resample() - def time_resample_datetime64(self): - # GH 7754 - self.dt_ts.resample('1S', how='last') - def time_1min_5min_mean(self): - self.ts2[:10000].resample('5min', how='mean') +class ResampleDatetetime64(object): + # GH 7754 + def setup(self): + rng3 = date_range(start='2000-01-01 00:00:00', + end='2000-01-01 10:00:00', freq='555000U') + self.dt_ts = Series(5, rng3, dtype='datetime64[ns]') - def time_1min_5min_ohlc(self): - self.ts2[:10000].resample('5min', how='ohlc') + def time_resample(self): + self.dt_ts.resample('1S').last() class AsOf(object): - goal_time = 0.2 - def setup(self): - self.N = 10000 - self.rng = date_range(start='1/1/1990', periods=self.N, freq='53s') - self.ts = Series(np.random.randn(self.N), index=self.rng) - self.dates = date_range(start='1/1/1990', periods=(self.N * 10), freq='5s') + params = ['DataFrame', 'Series'] + param_names = ['constructor'] + + def setup(self, constructor): + N = 10000 + M = 10 + rng = date_range(start='1/1/1990', periods=N, freq='53s') + data = {'DataFrame': DataFrame(np.random.randn(N, M)), + 'Series': Series(np.random.randn(N))} + self.ts = data[constructor] + self.ts.index = rng self.ts2 = self.ts.copy() - self.ts2[250:5000] = np.nan + self.ts2.iloc[250:5000] = np.nan self.ts3 = self.ts.copy() - self.ts3[-5000:] = np.nan + self.ts3.iloc[-5000:] = np.nan + self.dates = date_range(start='1/1/1990', periods=N * 10, freq='5s') + self.date = self.dates[0] + self.date_last = self.dates[-1] + self.date_early = self.date - timedelta(10) # test speed of pre-computing NAs. - def time_asof(self): + def time_asof(self, constructor): self.ts.asof(self.dates) # should be roughly the same as above. - def time_asof_nan(self): + def time_asof_nan(self, constructor): self.ts2.asof(self.dates) # test speed of the code path for a scalar index # without *while* loop - def time_asof_single(self): - self.ts.asof(self.dates[0]) + def time_asof_single(self, constructor): + self.ts.asof(self.date) # test speed of the code path for a scalar index # before the start. should be the same as above. - def time_asof_single_early(self): - self.ts.asof(self.dates[0] - dt.timedelta(10)) + def time_asof_single_early(self, constructor): + self.ts.asof(self.date_early) # test the speed of the code path for a scalar index # with a long *while* loop. should still be much # faster than pre-computing all the NAs. - def time_asof_nan_single(self): - self.ts3.asof(self.dates[-1]) + def time_asof_nan_single(self, constructor): + self.ts3.asof(self.date_last) -class AsOfDataFrame(object): - goal_time = 0.2 +class SortIndex(object): - def setup(self): - self.N = 10000 - self.M = 100 - self.rng = date_range(start='1/1/1990', periods=self.N, freq='53s') - self.dates = date_range(start='1/1/1990', periods=(self.N * 10), freq='5s') - self.ts = DataFrame(np.random.randn(self.N, self.M), index=self.rng) - self.ts2 = self.ts.copy() - self.ts2.iloc[250:5000] = np.nan - self.ts3 = self.ts.copy() - self.ts3.iloc[-5000:] = np.nan + params = [True, False] + param_names = ['monotonic'] - # test speed of pre-computing NAs. - def time_asof(self): - self.ts.asof(self.dates) - - # should be roughly the same as above. 
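The comments in AsOf above distinguish the array code path (which pre-computes the NaN positions) from the scalar code path (which walks backwards from the requested label). As a plain illustration of what asof returns in both cases, relying only on public pandas behaviour:

import numpy as np
import pandas as pd

s = pd.Series([1.0, np.nan, 3.0],
              index=pd.to_datetime(['2000-01-01', '2000-01-02', '2000-01-03']))
s.asof(pd.Timestamp('2000-01-02'))  # 1.0 -- last non-NaN value at or before the label
s.asof(s.index)                     # Series([1.0, 1.0, 3.0]), the array code path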
- def time_asof_nan(self): - self.ts2.asof(self.dates) + def setup(self, monotonic): + N = 10**5 + idx = date_range(start='1/1/2000', periods=N, freq='s') + self.s = Series(np.random.randn(N), index=idx) + if not monotonic: + self.s = self.s.sample(frac=1) - # test speed of the code path for a scalar index - # with pre-computing all NAs. - def time_asof_single(self): - self.ts.asof(self.dates[0]) + def time_sort_index(self, monotonic): + self.s.sort_index() - # should be roughly the same as above. - def time_asof_nan_single(self): - self.ts3.asof(self.dates[-1]) + def time_get_slice(self, monotonic): + self.s[:10000] - # test speed of the code path for a scalar index - # before the start. should be without the cost of - # pre-computing all the NAs. - def time_asof_single_early(self): - self.ts.asof(self.dates[0] - dt.timedelta(10)) - -class TimeSeries(object): - goal_time = 0.2 +class IrregularOps(object): def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='s') - self.rng = self.rng.take(np.random.permutation(self.N)) - self.ts = Series(np.random.randn(self.N), index=self.rng) - - self.rng2 = date_range(start='1/1/2000', periods=self.N, freq='T') - self.ts2 = Series(np.random.randn(self.N), index=self.rng2) + N = 10**5 + idx = date_range(start='1/1/2000', periods=N, freq='s') + s = Series(np.random.randn(N), index=idx) + self.left = s.sample(frac=1) + self.right = s.sample(frac=1) - self.lindex = np.random.permutation(self.N)[:(self.N // 2)] - self.rindex = np.random.permutation(self.N)[:(self.N // 2)] - self.left = Series(self.ts2.values.take(self.lindex), index=self.ts2.index.take(self.lindex)) - self.right = Series(self.ts2.values.take(self.rindex), index=self.ts2.index.take(self.rindex)) + def time_add(self): + self.left + self.right - self.rng3 = date_range(start='1/1/2000', periods=1500000, freq='S') - self.ts3 = Series(1, index=self.rng3) - def time_sort_index(self): - self.ts.sort_index() +class Lookup(object): - def time_timeseries_slice_minutely(self): - self.ts2[:10000] - - def time_add_irregular(self): - (self.left + self.right) + def setup(self): + N = 1500000 + rng = date_range(start='1/1/2000', periods=N, freq='S') + self.ts = Series(1, index=rng) + self.lookup_val = rng[N // 2] - def time_large_lookup_value(self): - self.ts3[self.ts3.index[(len(self.ts3) // 2)]] - self.ts3.index._cleanup() + def time_lookup_and_cleanup(self): + self.ts[self.lookup_val] + self.ts.index._cleanup() -class SeriesArithmetic(object): - goal_time = 0.2 +class ToDatetimeYYYYMMDD(object): def setup(self): - self.N = 100000 - self.s = Series(date_range(start='20140101', freq='T', periods=self.N)) - self.delta_offset = pd.offsets.Day() - self.fast_offset = pd.offsets.DateOffset(months=2, days=2) - self.slow_offset = pd.offsets.BusinessDay() - - def time_add_offset_delta(self): - (self.s + self.delta_offset) + rng = date_range(start='1/1/2000', periods=10000, freq='D') + self.stringsD = Series(rng.strftime('%Y%m%d')) - def time_add_offset_fast(self): - (self.s + self.fast_offset) - - def time_add_offset_slow(self): - (self.s + self.slow_offset) + def time_format_YYYYMMDD(self): + to_datetime(self.stringsD, format='%Y%m%d') -class ToDatetime(object): - goal_time = 0.2 +class ToDatetimeISO8601(object): def setup(self): - self.rng = date_range(start='1/1/2000', periods=10000, freq='D') - self.stringsD = Series((((self.rng.year * 10000) + (self.rng.month * 100)) + self.rng.day), dtype=np.int64).apply(str) - - self.rng = date_range(start='1/1/2000', 
periods=20000, freq='H') - self.strings = [x.strftime('%Y-%m-%d %H:%M:%S') for x in self.rng] - self.strings_nosep = [x.strftime('%Y%m%d %H:%M:%S') for x in self.rng] + rng = date_range(start='1/1/2000', periods=20000, freq='H') + self.strings = rng.strftime('%Y-%m-%d %H:%M:%S').tolist() + self.strings_nosep = rng.strftime('%Y%m%d %H:%M:%S').tolist() self.strings_tz_space = [x.strftime('%Y-%m-%d %H:%M:%S') + ' -0800' - for x in self.rng] - - self.s = Series((['19MAY11', '19MAY11:00:00:00'] * 100000)) - self.s2 = self.s.str.replace(':\\S+$', '') - - def time_format_YYYYMMDD(self): - to_datetime(self.stringsD, format='%Y%m%d') + for x in rng] def time_iso8601(self): to_datetime(self.strings) @@ -360,138 +324,105 @@ def time_iso8601_format_no_sep(self): def time_iso8601_tz_spaceformat(self): to_datetime(self.strings_tz_space) - def time_format_exact(self): - to_datetime(self.s2, format='%d%b%y') - - def time_format_no_exact(self): - to_datetime(self.s, format='%d%b%y', exact=False) - -class Offsets(object): - goal_time = 0.2 +class ToDatetimeNONISO8601(object): def setup(self): - self.date = dt.datetime(2011, 1, 1) - self.dt64 = np.datetime64('2011-01-01 09:00Z') - self.hcal = pd.tseries.holiday.USFederalHolidayCalendar() - self.day = pd.offsets.Day() - self.year = pd.offsets.YearBegin() - self.cday = pd.offsets.CustomBusinessDay() - self.cmb = pd.offsets.CustomBusinessMonthBegin(calendar=self.hcal) - self.cme = pd.offsets.CustomBusinessMonthEnd(calendar=self.hcal) - self.cdayh = pd.offsets.CustomBusinessDay(calendar=self.hcal) - - def time_timeseries_day_apply(self): - self.day.apply(self.date) - - def time_timeseries_day_incr(self): - (self.date + self.day) - - def time_timeseries_year_apply(self): - self.year.apply(self.date) + N = 10000 + half = int(N / 2) + ts_string_1 = 'March 1, 2018 12:00:00+0400' + ts_string_2 = 'March 1, 2018 12:00:00+0500' + self.same_offset = [ts_string_1] * N + self.diff_offset = [ts_string_1] * half + [ts_string_2] * half - def time_timeseries_year_incr(self): - (self.date + self.year) + def time_same_offset(self): + to_datetime(self.same_offset) - # custom business offsets + def time_different_offset(self): + to_datetime(self.diff_offset) - def time_custom_bday_decr(self): - (self.date - self.cday) - def time_custom_bday_incr(self): - (self.date + self.cday) +class ToDatetimeFormatQuarters(object): - def time_custom_bday_apply(self): - self.cday.apply(self.date) - - def time_custom_bday_apply_dt64(self): - self.cday.apply(self.dt64) - - def time_custom_bday_cal_incr(self): - self.date + 1 * self.cdayh + def setup(self): + self.s = Series(['2Q2005', '2Q05', '2005Q1', '05Q1'] * 10000) - def time_custom_bday_cal_decr(self): - self.date - 1 * self.cdayh + def time_infer_quarter(self): + to_datetime(self.s) - def time_custom_bday_cal_incr_n(self): - self.date + 10 * self.cdayh - def time_custom_bday_cal_incr_neg_n(self): - self.date - 10 * self.cdayh +class ToDatetimeFormat(object): - # Increment custom business month + def setup(self): + self.s = Series(['19MAY11', '19MAY11:00:00:00'] * 100000) + self.s2 = self.s.str.replace(':\\S+$', '') - def time_custom_bmonthend_incr(self): - (self.date + self.cme) + def time_exact(self): + to_datetime(self.s2, format='%d%b%y') - def time_custom_bmonthend_incr_n(self): - (self.date + (10 * self.cme)) + def time_no_exact(self): + to_datetime(self.s, format='%d%b%y', exact=False) - def time_custom_bmonthend_decr_n(self): - (self.date - (10 * self.cme)) - def time_custom_bmonthbegin_decr_n(self): - (self.date - (10 * self.cmb)) 
+class ToDatetimeCache(object): - def time_custom_bmonthbegin_incr_n(self): - (self.date + (10 * self.cmb)) + params = [True, False] + param_names = ['cache'] + def setup(self, cache): + N = 10000 + self.unique_numeric_seconds = list(range(N)) + self.dup_numeric_seconds = [1000] * N + self.dup_string_dates = ['2000-02-11'] * N + self.dup_string_with_tz = ['2000-02-11 15:00:00-0800'] * N -class SemiMonthOffset(object): - goal_time = 0.2 + def time_unique_seconds_and_unit(self, cache): + to_datetime(self.unique_numeric_seconds, unit='s', cache=cache) - def setup(self): - self.N = 100000 - self.rng = date_range(start='1/1/2000', periods=self.N, freq='T') - # date is not on an offset which will be slowest case - self.date = dt.datetime(2011, 1, 2) - self.semi_month_end = pd.offsets.SemiMonthEnd() - self.semi_month_begin = pd.offsets.SemiMonthBegin() + def time_dup_seconds_and_unit(self, cache): + to_datetime(self.dup_numeric_seconds, unit='s', cache=cache) - def time_end_apply(self): - self.semi_month_end.apply(self.date) + def time_dup_string_dates(self, cache): + to_datetime(self.dup_string_dates, cache=cache) - def time_end_incr(self): - self.date + self.semi_month_end + def time_dup_string_dates_and_format(self, cache): + to_datetime(self.dup_string_dates, format='%Y-%m-%d', cache=cache) - def time_end_incr_n(self): - self.date + 10 * self.semi_month_end + def time_dup_string_tzoffset_dates(self, cache): + to_datetime(self.dup_string_with_tz, cache=cache) - def time_end_decr(self): - self.date - self.semi_month_end - def time_end_decr_n(self): - self.date - 10 * self.semi_month_end +class DatetimeAccessor(object): - def time_end_apply_index(self): - self.semi_month_end.apply_index(self.rng) + params = [None, 'US/Eastern', 'UTC', dateutil.tz.tzutc()] + param_names = 'tz' - def time_end_incr_rng(self): - self.rng + self.semi_month_end + def setup(self, tz): + N = 100000 + self.series = Series( + date_range(start='1/1/2000', periods=N, freq='T', tz=tz) + ) - def time_end_decr_rng(self): - self.rng - self.semi_month_end + def time_dt_accessor(self, tz): + self.series.dt - def time_begin_apply(self): - self.semi_month_begin.apply(self.date) + def time_dt_accessor_normalize(self, tz): + self.series.dt.normalize() - def time_begin_incr(self): - self.date + self.semi_month_begin + def time_dt_accessor_month_name(self, tz): + self.series.dt.month_name() - def time_begin_incr_n(self): - self.date + 10 * self.semi_month_begin + def time_dt_accessor_day_name(self, tz): + self.series.dt.day_name() - def time_begin_decr(self): - self.date - self.semi_month_begin + def time_dt_accessor_time(self, tz): + self.series.dt.time - def time_begin_decr_n(self): - self.date - 10 * self.semi_month_begin + def time_dt_accessor_date(self, tz): + self.series.dt.date - def time_begin_apply_index(self): - self.semi_month_begin.apply_index(self.rng) + def time_dt_accessor_year(self, tz): + self.series.dt.year - def time_begin_incr_rng(self): - self.rng + self.semi_month_begin - def time_begin_decr_rng(self): - self.rng - self.semi_month_begin +from .pandas_vb_common import setup # noqa: F401 diff --git a/asv_bench/benchmarks/timestamp.py b/asv_bench/benchmarks/timestamp.py new file mode 100644 index 0000000000000..b45ae22650e17 --- /dev/null +++ b/asv_bench/benchmarks/timestamp.py @@ -0,0 +1,140 @@ +import datetime + +import dateutil +import pytz + +from pandas import Timestamp + + +class TimestampConstruction(object): + + def time_parse_iso8601_no_tz(self): + Timestamp('2017-08-25 08:16:14') + + def 
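ToDatetimeCache above parametrises the cache keyword of to_datetime; with cache=True pandas parses each distinct string once and reuses the result, which is what makes the dup_* cases interesting. A short usage sketch, separate from the patch itself:

import pandas as pd

dup_dates = ['2000-02-11'] * 10000
pd.to_datetime(dup_dates, cache=True)   # unique values parsed once, then reused
pd.to_datetime(dup_dates, cache=False)  # every element parsed individually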
time_parse_iso8601_tz(self): + Timestamp('2017-08-25 08:16:14-0500') + + def time_parse_dateutil(self): + Timestamp('2017/08/25 08:16:14 AM') + + def time_parse_today(self): + Timestamp('today') + + def time_parse_now(self): + Timestamp('now') + + def time_fromordinal(self): + Timestamp.fromordinal(730120) + + def time_fromtimestamp(self): + Timestamp.fromtimestamp(1515448538) + + +class TimestampProperties(object): + _tzs = [None, pytz.timezone('Europe/Amsterdam'), pytz.UTC, + dateutil.tz.tzutc()] + _freqs = [None, 'B'] + params = [_tzs, _freqs] + param_names = ['tz', 'freq'] + + def setup(self, tz, freq): + self.ts = Timestamp('2017-08-25 08:16:14', tzinfo=tz, freq=freq) + + def time_tz(self, tz, freq): + self.ts.tz + + def time_dayofweek(self, tz, freq): + self.ts.dayofweek + + def time_weekday_name(self, tz, freq): + self.ts.day_name + + def time_dayofyear(self, tz, freq): + self.ts.dayofyear + + def time_week(self, tz, freq): + self.ts.week + + def time_quarter(self, tz, freq): + self.ts.quarter + + def time_days_in_month(self, tz, freq): + self.ts.days_in_month + + def time_freqstr(self, tz, freq): + self.ts.freqstr + + def time_is_month_start(self, tz, freq): + self.ts.is_month_start + + def time_is_month_end(self, tz, freq): + self.ts.is_month_end + + def time_is_quarter_start(self, tz, freq): + self.ts.is_quarter_start + + def time_is_quarter_end(self, tz, freq): + self.ts.is_quarter_end + + def time_is_year_start(self, tz, freq): + self.ts.is_year_start + + def time_is_year_end(self, tz, freq): + self.ts.is_year_end + + def time_is_leap_year(self, tz, freq): + self.ts.is_leap_year + + def time_microsecond(self, tz, freq): + self.ts.microsecond + + def time_month_name(self, tz, freq): + self.ts.month_name() + + +class TimestampOps(object): + params = [None, 'US/Eastern', pytz.UTC, + dateutil.tz.tzutc()] + param_names = ['tz'] + + def setup(self, tz): + self.ts = Timestamp('2017-08-25 08:16:14', tz=tz) + + def time_replace_tz(self, tz): + self.ts.replace(tzinfo=pytz.timezone('US/Eastern')) + + def time_replace_None(self, tz): + self.ts.replace(tzinfo=None) + + def time_to_pydatetime(self, tz): + self.ts.to_pydatetime() + + def time_normalize(self, tz): + self.ts.normalize() + + def time_tz_convert(self, tz): + if self.ts.tz is not None: + self.ts.tz_convert(tz) + + def time_tz_localize(self, tz): + if self.ts.tz is None: + self.ts.tz_localize(tz) + + def time_to_julian_date(self, tz): + self.ts.to_julian_date() + + def time_floor(self, tz): + self.ts.floor('5T') + + def time_ceil(self, tz): + self.ts.ceil('5T') + + +class TimestampAcrossDst(object): + def setup(self): + dt = datetime.datetime(2016, 3, 27, 1) + self.tzinfo = pytz.timezone('CET').localize(dt, is_dst=False).tzinfo + self.ts2 = Timestamp(dt) + + def time_replace_across_dst(self): + self.ts2.replace(tzinfo=self.tzinfo) diff --git a/asv_bench/vbench_to_asv.py b/asv_bench/vbench_to_asv.py deleted file mode 100644 index c3041ec2b1ba1..0000000000000 --- a/asv_bench/vbench_to_asv.py +++ /dev/null @@ -1,163 +0,0 @@ -import ast -import vbench -import os -import sys -import astor -import glob - - -def vbench_to_asv_source(bench, kinds=None): - tab = ' ' * 4 - if kinds is None: - kinds = ['time'] - - output = 'class {}(object):\n'.format(bench.name) - output += tab + 'goal_time = 0.2\n\n' - - if bench.setup: - indented_setup = [tab * 2 + '{}\n'.format(x) for x in bench.setup.splitlines()] - output += tab + 'def setup(self):\n' + ''.join(indented_setup) + '\n' - - for kind in kinds: - output += tab + 'def 
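TimestampOps above guards time_tz_convert and time_tz_localize because the two operations are complementary: tz_localize attaches a timezone to a naive Timestamp, while tz_convert only applies to one that is already timezone-aware. A brief illustration of that distinction:

import pandas as pd

naive = pd.Timestamp('2017-08-25 08:16:14')
aware = naive.tz_localize('US/Eastern')  # naive -> aware
aware.tz_convert('UTC')                  # aware -> another zone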
{}_{}(self):\n'.format(kind, bench.name) - for line in bench.code.splitlines(): - output += tab * 2 + line + '\n' - output += '\n\n' - - if bench.cleanup: - output += tab + 'def teardown(self):\n' + tab * 2 + bench.cleanup - - output += '\n\n' - return output - - -class AssignToSelf(ast.NodeTransformer): - def __init__(self): - super(AssignToSelf, self).__init__() - self.transforms = {} - self.imports = [] - - self.in_class_define = False - self.in_setup = False - - def visit_ClassDef(self, node): - self.transforms = {} - self.in_class_define = True - - functions_to_promote = [] - setup_func = None - - for class_func in ast.iter_child_nodes(node): - if isinstance(class_func, ast.FunctionDef): - if class_func.name == 'setup': - setup_func = class_func - for anon_func in ast.iter_child_nodes(class_func): - if isinstance(anon_func, ast.FunctionDef): - functions_to_promote.append(anon_func) - - if setup_func: - for func in functions_to_promote: - setup_func.body.remove(func) - func.args.args.insert(0, ast.Name(id='self', ctx=ast.Load())) - node.body.append(func) - self.transforms[func.name] = 'self.' + func.name - - ast.fix_missing_locations(node) - - self.generic_visit(node) - - return node - - def visit_TryExcept(self, node): - if any([isinstance(x, (ast.Import, ast.ImportFrom)) for x in node.body]): - self.imports.append(node) - else: - self.generic_visit(node) - return node - - def visit_Assign(self, node): - for target in node.targets: - if isinstance(target, ast.Name) and not isinstance(target.ctx, ast.Param) and not self.in_class_define: - self.transforms[target.id] = 'self.' + target.id - self.generic_visit(node) - - return node - - def visit_Name(self, node): - new_node = node - if node.id in self.transforms: - if not isinstance(node.ctx, ast.Param): - new_node = ast.Attribute(value=ast.Name(id='self', ctx=node.ctx), attr=node.id, ctx=node.ctx) - - self.generic_visit(node) - - return ast.copy_location(new_node, node) - - def visit_Import(self, node): - self.imports.append(node) - - def visit_ImportFrom(self, node): - self.imports.append(node) - - def visit_FunctionDef(self, node): - """Delete functions that are empty due to imports being moved""" - self.in_class_define = False - - self.generic_visit(node) - - if node.body: - return node - - -def translate_module(target_module): - g_vars = {} - l_vars = {} - exec('import ' + target_module) in g_vars - - print target_module - module = eval(target_module, g_vars) - - benchmarks = [] - for obj_str in dir(module): - obj = getattr(module, obj_str) - if isinstance(obj, vbench.benchmark.Benchmark): - benchmarks.append(obj) - - if not benchmarks: - return - - rewritten_output = '' - for bench in benchmarks: - rewritten_output += vbench_to_asv_source(bench) - - with open('rewrite.py', 'w') as f: - f.write(rewritten_output) - - ast_module = ast.parse(rewritten_output) - - transformer = AssignToSelf() - transformed_module = transformer.visit(ast_module) - - unique_imports = {astor.to_source(node): node for node in transformer.imports} - - transformed_module.body = unique_imports.values() + transformed_module.body - - transformed_source = astor.to_source(transformed_module) - - with open('benchmarks/{}.py'.format(target_module), 'w') as f: - f.write(transformed_source) - - -if __name__ == '__main__': - cwd = os.getcwd() - new_dir = os.path.join(os.path.dirname(__file__), '../vb_suite') - sys.path.insert(0, new_dir) - - for module in glob.glob(os.path.join(new_dir, '*.py')): - mod = os.path.basename(module) - if mod in ['make.py', 
'measure_memory_consumption.py', 'perf_HEAD.py', 'run_suite.py', 'test_perf.py', 'generate_rst_files.py', 'test.py', 'suite.py']: - continue - print - print mod - - translate_module(mod.replace('.py', '')) diff --git a/azure-pipelines.yml b/azure-pipelines.yml new file mode 100644 index 0000000000000..f0567d76659b6 --- /dev/null +++ b/azure-pipelines.yml @@ -0,0 +1,119 @@ +# Adapted from https://github.com/numba/numba/blob/master/azure-pipelines.yml +jobs: +# Mac and Linux use the same template +- template: ci/azure/posix.yml + parameters: + name: macOS + vmImage: xcode9-macos10.13 +- template: ci/azure/posix.yml + parameters: + name: Linux + vmImage: ubuntu-16.04 + +# Windows Python 2.7 needs VC 9.0 installed, handled in the template +- template: ci/azure/windows.yml + parameters: + name: Windows + vmImage: vs2017-win2016 + +- job: 'Checks_and_doc' + pool: + vmImage: ubuntu-16.04 + timeoutInMinutes: 90 + steps: + - script: | + # XXX next command should avoid redefining the path in every step, but + # made the process crash as it couldn't find deactivate + #echo '##vso[task.prependpath]$HOME/miniconda3/bin' + echo '##vso[task.setvariable variable=CONDA_ENV]pandas-dev' + echo '##vso[task.setvariable variable=ENV_FILE]environment.yml' + echo '##vso[task.setvariable variable=AZURE]true' + displayName: 'Setting environment variables' + + # Do not require a conda environment + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + ci/code_checks.sh patterns + displayName: 'Looking for unwanted patterns' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + sudo apt-get install -y libc6-dev-i386 + ci/incremental/install_miniconda.sh + ci/incremental/setup_conda_environment.sh + displayName: 'Set up environment' + condition: true + + # Do not require pandas + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/code_checks.sh lint + displayName: 'Linting' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/code_checks.sh dependencies + displayName: 'Dependencies consistency' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/incremental/build.sh + displayName: 'Build' + condition: true + + # Require pandas + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/code_checks.sh code + displayName: 'Checks on imported code' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/code_checks.sh doctests + displayName: 'Running doctests' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/code_checks.sh docstrings + displayName: 'Docstring validation' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + pytest --capture=no --strict scripts + displayName: 'Testing docstring validaton script' + condition: true + + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + git remote add upstream https://github.com/pandas-dev/pandas.git + git fetch upstream + if git diff upstream/master --name-only | grep -q "^asv_bench/"; then + cd asv_bench + asv machine --yes + ASV_OUTPUT="$(asv dev)" + if [[ $(echo "$ASV_OUTPUT" | grep "failed") ]]; then + echo "##vso[task.logissue type=error]Benchmarks run with errors" + echo "$ASV_OUTPUT" + exit 1 + else + echo "Benchmarks run without errors" + fi + else + echo "Benchmarks did 
not run, no changes detected" + fi + displayName: 'Running benchmarks' + condition: true diff --git a/bench/alignment.py b/bench/alignment.py deleted file mode 100644 index bc3134f597ee0..0000000000000 --- a/bench/alignment.py +++ /dev/null @@ -1,22 +0,0 @@ -# Setup -from pandas.compat import range, lrange -import numpy as np -import pandas -import la -N = 1000 -K = 50 -arr1 = np.random.randn(N, K) -arr2 = np.random.randn(N, K) -idx1 = lrange(N) -idx2 = lrange(K) - -# pandas -dma1 = pandas.DataFrame(arr1, idx1, idx2) -dma2 = pandas.DataFrame(arr2, idx1[::-1], idx2[::-1]) - -# larry -lar1 = la.larry(arr1, [idx1, idx2]) -lar2 = la.larry(arr2, [idx1[::-1], idx2[::-1]]) - -for i in range(100): - result = lar1 + lar2 diff --git a/bench/bench_dense_to_sparse.py b/bench/bench_dense_to_sparse.py deleted file mode 100644 index e1dcd3456e88d..0000000000000 --- a/bench/bench_dense_to_sparse.py +++ /dev/null @@ -1,14 +0,0 @@ -from pandas import * - -K = 100 -N = 100000 -rng = DatetimeIndex('1/1/2000', periods=N, offset=datetools.Minute()) - -rng2 = np.asarray(rng).astype('M8[us]').astype('i8') - -series = {} -for i in range(1, K + 1): - data = np.random.randn(N)[:-i] - this_rng = rng2[:-i] - data[100:] = np.nan - series[i] = SparseSeries(data, index=this_rng) diff --git a/bench/bench_get_put_value.py b/bench/bench_get_put_value.py deleted file mode 100644 index 427e0b1b10a22..0000000000000 --- a/bench/bench_get_put_value.py +++ /dev/null @@ -1,56 +0,0 @@ -from pandas import * -from pandas.util.testing import rands -from pandas.compat import range - -N = 1000 -K = 50 - - -def _random_index(howmany): - return Index([rands(10) for _ in range(howmany)]) - -df = DataFrame(np.random.randn(N, K), index=_random_index(N), - columns=_random_index(K)) - - -def get1(): - for col in df.columns: - for row in df.index: - _ = df[col][row] - - -def get2(): - for col in df.columns: - for row in df.index: - _ = df.get_value(row, col) - - -def put1(): - for col in df.columns: - for row in df.index: - df[col][row] = 0 - - -def put2(): - for col in df.columns: - for row in df.index: - df.set_value(row, col, 0) - - -def resize1(): - buf = DataFrame() - for col in df.columns: - for row in df.index: - buf = buf.set_value(row, col, 5.) - return buf - - -def resize2(): - from collections import defaultdict - - buf = defaultdict(dict) - for col in df.columns: - for row in df.index: - buf[col][row] = 5. 
- - return DataFrame(buf) diff --git a/bench/bench_groupby.py b/bench/bench_groupby.py deleted file mode 100644 index d7a2853e1e7b2..0000000000000 --- a/bench/bench_groupby.py +++ /dev/null @@ -1,66 +0,0 @@ -from pandas import * -from pandas.util.testing import rands -from pandas.compat import range - -import string -import random - -k = 20000 -n = 10 - -foo = np.tile(np.array([rands(10) for _ in range(k)], dtype='O'), n) -foo2 = list(foo) -random.shuffle(foo) -random.shuffle(foo2) - -df = DataFrame({'A': foo, - 'B': foo2, - 'C': np.random.randn(n * k)}) - -import pandas._sandbox as sbx - - -def f(): - table = sbx.StringHashTable(len(df)) - ret = table.factorize(df['A']) - return ret - - -def g(): - table = sbx.PyObjectHashTable(len(df)) - ret = table.factorize(df['A']) - return ret - -ret = f() - -""" -import pandas._tseries as lib - -f = np.std - - -grouped = df.groupby(['A', 'B']) - -label_list = [ping.labels for ping in grouped.groupings] -shape = [len(ping.ids) for ping in grouped.groupings] - -from pandas.core.groupby import get_group_index - - -group_index = get_group_index(label_list, shape, - sort=True, xnull=True).astype('i4') - -ngroups = np.prod(shape) - -indexer = lib.groupsort_indexer(group_index, ngroups) - -values = df['C'].values.take(indexer) -group_index = group_index.take(indexer) - -f = lambda x: x.std(ddof=1) - -grouper = lib.Grouper(df['C'], np.ndarray.std, group_index, ngroups) -result = grouper.get_result() - -expected = grouped.std() -""" diff --git a/bench/bench_join_panel.py b/bench/bench_join_panel.py deleted file mode 100644 index f3c3f8ba15f70..0000000000000 --- a/bench/bench_join_panel.py +++ /dev/null @@ -1,85 +0,0 @@ -# reasonably efficient - - -def create_panels_append(cls, panels): - """ return an append list of panels """ - panels = [a for a in panels if a is not None] - # corner cases - if len(panels) == 0: - return None - elif len(panels) == 1: - return panels[0] - elif len(panels) == 2 and panels[0] == panels[1]: - return panels[0] - # import pdb; pdb.set_trace() - # create a joint index for the axis - - def joint_index_for_axis(panels, axis): - s = set() - for p in panels: - s.update(list(getattr(p, axis))) - return sorted(list(s)) - - def reindex_on_axis(panels, axis, axis_reindex): - new_axis = joint_index_for_axis(panels, axis) - new_panels = [p.reindex(**{axis_reindex: new_axis, - 'copy': False}) for p in panels] - return new_panels, new_axis - # create the joint major index, dont' reindex the sub-panels - we are - # appending - major = joint_index_for_axis(panels, 'major_axis') - # reindex on minor axis - panels, minor = reindex_on_axis(panels, 'minor_axis', 'minor') - # reindex on items - panels, items = reindex_on_axis(panels, 'items', 'items') - # concatenate values - try: - values = np.concatenate([p.values for p in panels], axis=1) - except Exception as detail: - raise Exception("cannot append values that dont' match dimensions! 
-> [%s] %s" - % (','.join(["%s" % p for p in panels]), str(detail))) - # pm('append - create_panel') - p = Panel(values, items=items, major_axis=major, - minor_axis=minor) - # pm('append - done') - return p - - -# does the job but inefficient (better to handle like you read a table in -# pytables...e.g create a LongPanel then convert to Wide) -def create_panels_join(cls, panels): - """ given an array of panels's, create a single panel """ - panels = [a for a in panels if a is not None] - # corner cases - if len(panels) == 0: - return None - elif len(panels) == 1: - return panels[0] - elif len(panels) == 2 and panels[0] == panels[1]: - return panels[0] - d = dict() - minor, major, items = set(), set(), set() - for panel in panels: - items.update(panel.items) - major.update(panel.major_axis) - minor.update(panel.minor_axis) - values = panel.values - for item, item_index in panel.items.indexMap.items(): - for minor_i, minor_index in panel.minor_axis.indexMap.items(): - for major_i, major_index in panel.major_axis.indexMap.items(): - try: - d[(minor_i, major_i, item)] = values[item_index, major_index, minor_index] - except: - pass - # stack the values - minor = sorted(list(minor)) - major = sorted(list(major)) - items = sorted(list(items)) - # create the 3d stack (items x columns x indicies) - data = np.dstack([np.asarray([np.asarray([d.get((minor_i, major_i, item), np.nan) - for item in items]) - for major_i in major]).transpose() - for minor_i in minor]) - # construct the panel - return Panel(data, items, major, minor) -add_class_method(Panel, create_panels_join, 'join_many') diff --git a/bench/bench_khash_dict.py b/bench/bench_khash_dict.py deleted file mode 100644 index 054fc36131b65..0000000000000 --- a/bench/bench_khash_dict.py +++ /dev/null @@ -1,89 +0,0 @@ -""" -Some comparisons of khash.h to Python dict -""" -from __future__ import print_function - -import numpy as np -import os - -from vbench.api import Benchmark -from pandas.util.testing import rands -from pandas.compat import range -import pandas._tseries as lib -import pandas._sandbox as sbx -import time - -import psutil - -pid = os.getpid() -proc = psutil.Process(pid) - - -def object_test_data(n): - pass - - -def string_test_data(n): - return np.array([rands(10) for _ in range(n)], dtype='O') - - -def int_test_data(n): - return np.arange(n, dtype='i8') - -N = 1000000 - -#---------------------------------------------------------------------- -# Benchmark 1: map_locations - - -def map_locations_python_object(): - arr = string_test_data(N) - return _timeit(lambda: lib.map_indices_object(arr)) - - -def map_locations_khash_object(): - arr = string_test_data(N) - - def f(): - table = sbx.PyObjectHashTable(len(arr)) - table.map_locations(arr) - return _timeit(f) - - -def _timeit(f, iterations=10): - start = time.time() - for _ in range(iterations): - foo = f() - elapsed = time.time() - start - return elapsed - -#---------------------------------------------------------------------- -# Benchmark 2: lookup_locations - - -def lookup_python(values): - table = lib.map_indices_object(values) - return _timeit(lambda: lib.merge_indexer_object(values, table)) - - -def lookup_khash(values): - table = sbx.PyObjectHashTable(len(values)) - table.map_locations(values) - locs = table.lookup_locations(values) - # elapsed = _timeit(lambda: table.lookup_locations2(values)) - return table - - -def leak(values): - for _ in range(100): - print(proc.get_memory_info()) - table = lookup_khash(values) - # table.destroy() - -arr = string_test_data(N) - 
-#---------------------------------------------------------------------- -# Benchmark 3: unique - -#---------------------------------------------------------------------- -# Benchmark 4: factorize diff --git a/bench/bench_merge.R b/bench/bench_merge.R deleted file mode 100644 index 3ed4618494857..0000000000000 --- a/bench/bench_merge.R +++ /dev/null @@ -1,161 +0,0 @@ -library(plyr) -library(data.table) -N <- 10000 -indices = rep(NA, N) -indices2 = rep(NA, N) -for (i in 1:N) { - indices[i] <- paste(sample(letters, 10), collapse="") - indices2[i] <- paste(sample(letters, 10), collapse="") -} -left <- data.frame(key=rep(indices[1:8000], 10), - key2=rep(indices2[1:8000], 10), - value=rnorm(80000)) -right <- data.frame(key=indices[2001:10000], - key2=indices2[2001:10000], - value2=rnorm(8000)) - -right2 <- data.frame(key=rep(right$key, 2), - key2=rep(right$key2, 2), - value2=rnorm(16000)) - -left.dt <- data.table(left, key=c("key", "key2")) -right.dt <- data.table(right, key=c("key", "key2")) -right2.dt <- data.table(right2, key=c("key", "key2")) - -# left.dt2 <- data.table(left) -# right.dt2 <- data.table(right) - -## left <- data.frame(key=rep(indices[1:1000], 10), -## key2=rep(indices2[1:1000], 10), -## value=rnorm(100000)) -## right <- data.frame(key=indices[1:1000], -## key2=indices2[1:1000], -## value2=rnorm(10000)) - -timeit <- function(func, niter=10) { - timing = rep(NA, niter) - for (i in 1:niter) { - gc() - timing[i] <- system.time(func())[3] - } - mean(timing) -} - -left.join <- function(sort=FALSE) { - result <- base::merge(left, right, all.x=TRUE, sort=sort) -} - -right.join <- function(sort=FALSE) { - result <- base::merge(left, right, all.y=TRUE, sort=sort) -} - -outer.join <- function(sort=FALSE) { - result <- base::merge(left, right, all=TRUE, sort=sort) -} - -inner.join <- function(sort=FALSE) { - result <- base::merge(left, right, all=FALSE, sort=sort) -} - -left.join.dt <- function(sort=FALSE) { - result <- right.dt[left.dt] -} - -right.join.dt <- function(sort=FALSE) { - result <- left.dt[right.dt] -} - -outer.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right.dt, all=TRUE, sort=sort) -} - -inner.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right.dt, all=FALSE, sort=sort) -} - -plyr.join <- function(type) { - result <- plyr::join(left, right, by=c("key", "key2"), - type=type, match="first") -} - -sort.options <- c(FALSE, TRUE) - -# many-to-one - -results <- matrix(nrow=4, ncol=3) -colnames(results) <- c("base::merge", "plyr", "data.table") -rownames(results) <- c("inner", "outer", "left", "right") - -base.functions <- c(inner.join, outer.join, left.join, right.join) -plyr.functions <- c(function() plyr.join("inner"), - function() plyr.join("full"), - function() plyr.join("left"), - function() plyr.join("right")) -dt.functions <- c(inner.join.dt, outer.join.dt, left.join.dt, right.join.dt) -for (i in 1:4) { - base.func <- base.functions[[i]] - plyr.func <- plyr.functions[[i]] - dt.func <- dt.functions[[i]] - results[i, 1] <- timeit(base.func) - results[i, 2] <- timeit(plyr.func) - results[i, 3] <- timeit(dt.func) -} - - -# many-to-many - -left.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all.x=TRUE, sort=sort) -} - -right.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all.y=TRUE, sort=sort) -} - -outer.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all=TRUE, sort=sort) -} - -inner.join <- function(sort=FALSE) { - result <- base::merge(left, right2, all=FALSE, sort=sort) -} - 
-left.join.dt <- function(sort=FALSE) { - result <- right2.dt[left.dt] -} - -right.join.dt <- function(sort=FALSE) { - result <- left.dt[right2.dt] -} - -outer.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right2.dt, all=TRUE, sort=sort) -} - -inner.join.dt <- function(sort=FALSE) { - result <- merge(left.dt, right2.dt, all=FALSE, sort=sort) -} - -sort.options <- c(FALSE, TRUE) - -# many-to-one - -results <- matrix(nrow=4, ncol=3) -colnames(results) <- c("base::merge", "plyr", "data.table") -rownames(results) <- c("inner", "outer", "left", "right") - -base.functions <- c(inner.join, outer.join, left.join, right.join) -plyr.functions <- c(function() plyr.join("inner"), - function() plyr.join("full"), - function() plyr.join("left"), - function() plyr.join("right")) -dt.functions <- c(inner.join.dt, outer.join.dt, left.join.dt, right.join.dt) -for (i in 1:4) { - base.func <- base.functions[[i]] - plyr.func <- plyr.functions[[i]] - dt.func <- dt.functions[[i]] - results[i, 1] <- timeit(base.func) - results[i, 2] <- timeit(plyr.func) - results[i, 3] <- timeit(dt.func) -} - diff --git a/bench/bench_merge.py b/bench/bench_merge.py deleted file mode 100644 index 330dba7b9af69..0000000000000 --- a/bench/bench_merge.py +++ /dev/null @@ -1,105 +0,0 @@ -import random -import gc -import time -from pandas import * -from pandas.compat import range, lrange, StringIO -from pandas.util.testing import rands - -N = 10000 -ngroups = 10 - - -def get_test_data(ngroups=100, n=N): - unique_groups = lrange(ngroups) - arr = np.asarray(np.tile(unique_groups, n / ngroups), dtype=object) - - if len(arr) < n: - arr = np.asarray(list(arr) + unique_groups[:n - len(arr)], - dtype=object) - - random.shuffle(arr) - return arr - -# aggregate multiple columns -# df = DataFrame({'key1' : get_test_data(ngroups=ngroups), -# 'key2' : get_test_data(ngroups=ngroups), -# 'data1' : np.random.randn(N), -# 'data2' : np.random.randn(N)}) - -# df2 = DataFrame({'key1' : get_test_data(ngroups=ngroups, n=N//10), -# 'key2' : get_test_data(ngroups=ngroups//2, n=N//10), -# 'value' : np.random.randn(N // 10)}) -# result = merge.merge(df, df2, on='key2') - -N = 10000 - -indices = np.array([rands(10) for _ in range(N)], dtype='O') -indices2 = np.array([rands(10) for _ in range(N)], dtype='O') -key = np.tile(indices[:8000], 10) -key2 = np.tile(indices2[:8000], 10) - -left = DataFrame({'key': key, 'key2': key2, - 'value': np.random.randn(80000)}) -right = DataFrame({'key': indices[2000:], 'key2': indices2[2000:], - 'value2': np.random.randn(8000)}) - -right2 = right.append(right, ignore_index=True) - - -join_methods = ['inner', 'outer', 'left', 'right'] -results = DataFrame(index=join_methods, columns=[False, True]) -niter = 10 -for sort in [False, True]: - for join_method in join_methods: - f = lambda: merge(left, right, how=join_method, sort=sort) - gc.disable() - start = time.time() - for _ in range(niter): - f() - elapsed = (time.time() - start) / niter - gc.enable() - results[sort][join_method] = elapsed -# results.columns = ['pandas'] -results.columns = ['dont_sort', 'sort'] - - -# R results -# many to one -r_results = read_table(StringIO(""" base::merge plyr data.table -inner 0.2475 0.1183 0.1100 -outer 0.4213 0.1916 0.2090 -left 0.2998 0.1188 0.0572 -right 0.3102 0.0536 0.0376 -"""), sep='\s+') - -presults = results[['dont_sort']].rename(columns={'dont_sort': 'pandas'}) -all_results = presults.join(r_results) - -all_results = all_results.div(all_results['pandas'], axis=0) - -all_results = all_results.ix[:, ['pandas', 
'data.table', 'plyr', - 'base::merge']] - -sort_results = DataFrame.from_items([('pandas', results['sort']), - ('R', r_results['base::merge'])]) -sort_results['Ratio'] = sort_results['R'] / sort_results['pandas'] - - -nosort_results = DataFrame.from_items([('pandas', results['dont_sort']), - ('R', r_results['base::merge'])]) -nosort_results['Ratio'] = nosort_results['R'] / nosort_results['pandas'] - -# many to many - -# many to one -r_results = read_table(StringIO("""base::merge plyr data.table -inner 0.4610 0.1276 0.1269 -outer 0.9195 0.1881 0.2725 -left 0.6559 0.1257 0.0678 -right 0.6425 0.0522 0.0428 -"""), sep='\s+') - -all_results = presults.join(r_results) -all_results = all_results.div(all_results['pandas'], axis=0) -all_results = all_results.ix[:, ['pandas', 'data.table', 'plyr', - 'base::merge']] diff --git a/bench/bench_merge_sqlite.py b/bench/bench_merge_sqlite.py deleted file mode 100644 index 3ad4b810119c3..0000000000000 --- a/bench/bench_merge_sqlite.py +++ /dev/null @@ -1,87 +0,0 @@ -import numpy as np -from collections import defaultdict -import gc -import time -from pandas import DataFrame -from pandas.util.testing import rands -from pandas.compat import range, zip -import random - -N = 10000 - -indices = np.array([rands(10) for _ in range(N)], dtype='O') -indices2 = np.array([rands(10) for _ in range(N)], dtype='O') -key = np.tile(indices[:8000], 10) -key2 = np.tile(indices2[:8000], 10) - -left = DataFrame({'key': key, 'key2': key2, - 'value': np.random.randn(80000)}) -right = DataFrame({'key': indices[2000:], 'key2': indices2[2000:], - 'value2': np.random.randn(8000)}) - -# right2 = right.append(right, ignore_index=True) -# right = right2 - -# random.shuffle(key2) -# indices2 = indices.copy() -# random.shuffle(indices2) - -# Prepare Database -import sqlite3 -create_sql_indexes = True - -conn = sqlite3.connect(':memory:') -conn.execute( - 'create table left( key varchar(10), key2 varchar(10), value int);') -conn.execute( - 'create table right( key varchar(10), key2 varchar(10), value2 int);') -conn.executemany('insert into left values (?, ?, ?)', - zip(key, key2, left['value'])) -conn.executemany('insert into right values (?, ?, ?)', - zip(right['key'], right['key2'], right['value2'])) - -# Create Indices -if create_sql_indexes: - conn.execute('create index left_ix on left(key, key2)') - conn.execute('create index right_ix on right(key, key2)') - - -join_methods = ['inner', 'left outer', 'left'] # others not supported -sql_results = DataFrame(index=join_methods, columns=[False]) -niter = 5 -for sort in [False]: - for join_method in join_methods: - sql = """CREATE TABLE test as select * - from left - %s join right - on left.key=right.key - and left.key2 = right.key2;""" % join_method - sql = """select * - from left - %s join right - on left.key=right.key - and left.key2 = right.key2;""" % join_method - - if sort: - sql = '%s order by key, key2' % sql - f = lambda: list(conn.execute(sql)) # list fetches results - g = lambda: conn.execute(sql) # list fetches results - gc.disable() - start = time.time() - # for _ in range(niter): - g() - elapsed = (time.time() - start) / niter - gc.enable() - - cur = conn.execute("DROP TABLE test") - conn.commit() - - sql_results[sort][join_method] = elapsed - sql_results.columns = ['sqlite3'] # ['dont_sort', 'sort'] - sql_results.index = ['inner', 'outer', 'left'] - - sql = """select * - from left - inner join right - on left.key=right.key - and left.key2 = right.key2;""" diff --git a/bench/bench_pivot.R b/bench/bench_pivot.R deleted file 
mode 100644 index 06dc6a105bc43..0000000000000 --- a/bench/bench_pivot.R +++ /dev/null @@ -1,27 +0,0 @@ -library(reshape2) - - -n <- 100000 -a.size <- 5 -b.size <- 5 - -data <- data.frame(a=sample(letters[1:a.size], n, replace=T), - b=sample(letters[1:b.size], n, replace=T), - c=rnorm(n), - d=rnorm(n)) - -timings <- numeric() - -# acast(melt(data, id=c("a", "b")), a ~ b, mean) -# acast(melt(data, id=c("a", "b")), a + b ~ variable, mean) - -for (i in 1:10) { - gc() - tim <- system.time(acast(melt(data, id=c("a", "b")), a ~ b, mean, - subset=.(variable=="c"))) - timings[i] = tim[3] -} - -mean(timings) - -acast(melt(data, id=c("a", "b")), a ~ b, mean, subset=.(variable="c")) diff --git a/bench/bench_pivot.py b/bench/bench_pivot.py deleted file mode 100644 index 007bd0aaebc2f..0000000000000 --- a/bench/bench_pivot.py +++ /dev/null @@ -1,16 +0,0 @@ -from pandas import * -import string - - -n = 100000 -asize = 5 -bsize = 5 - -letters = np.asarray(list(string.letters), dtype=object) - -data = DataFrame(dict(foo=letters[:asize][np.random.randint(0, asize, n)], - bar=letters[:bsize][np.random.randint(0, bsize, n)], - baz=np.random.randn(n), - qux=np.random.randn(n))) - -table = pivot_table(data, xby=['foo', 'bar']) diff --git a/bench/bench_take_indexing.py b/bench/bench_take_indexing.py deleted file mode 100644 index 5fb584bcfe45f..0000000000000 --- a/bench/bench_take_indexing.py +++ /dev/null @@ -1,55 +0,0 @@ -from __future__ import print_function -import numpy as np - -from pandas import * -import pandas._tseries as lib - -from pandas import DataFrame -import timeit -from pandas.compat import zip - -setup = """ -from pandas import Series -import pandas._tseries as lib -import random -import numpy as np - -import random -n = %d -k = %d -arr = np.random.randn(n, k) -indexer = np.arange(n, dtype=np.int32) -indexer = indexer[::-1] -""" - -sizes = [100, 1000, 10000, 100000] -iters = [1000, 1000, 100, 1] - -fancy_2d = [] -take_2d = [] -cython_2d = [] - -n = 1000 - - -def _timeit(stmt, size, k=5, iters=1000): - timer = timeit.Timer(stmt=stmt, setup=setup % (sz, k)) - return timer.timeit(n) / n - -for sz, its in zip(sizes, iters): - print(sz) - fancy_2d.append(_timeit('arr[indexer]', sz, iters=its)) - take_2d.append(_timeit('arr.take(indexer, axis=0)', sz, iters=its)) - cython_2d.append(_timeit('lib.take_axis0(arr, indexer)', sz, iters=its)) - -df = DataFrame({'fancy': fancy_2d, - 'take': take_2d, - 'cython': cython_2d}) - -print(df) - -from pandas.rpy.common import r -r('mat <- matrix(rnorm(50000), nrow=10000, ncol=5)') -r('set.seed(12345') -r('indexer <- sample(1:10000)') -r('mat[indexer,]') diff --git a/bench/bench_unique.py b/bench/bench_unique.py deleted file mode 100644 index 87bd2f2df586c..0000000000000 --- a/bench/bench_unique.py +++ /dev/null @@ -1,278 +0,0 @@ -from __future__ import print_function -from pandas import * -from pandas.util.testing import rands -from pandas.compat import range, zip -import pandas._tseries as lib -import numpy as np -import matplotlib.pyplot as plt - -N = 50000 -K = 10000 - -groups = np.array([rands(10) for _ in range(K)], dtype='O') -groups2 = np.array([rands(10) for _ in range(K)], dtype='O') - -labels = np.tile(groups, N // K) -labels2 = np.tile(groups2, N // K) -data = np.random.randn(N) - - -def timeit(f, niter): - import gc - import time - gc.disable() - start = time.time() - for _ in range(niter): - f() - elapsed = (time.time() - start) / niter - gc.enable() - return elapsed - - -def algo1(): - unique_labels = np.unique(labels) - result = 
np.empty(len(unique_labels)) - for i, label in enumerate(unique_labels): - result[i] = data[labels == label].sum() - - -def algo2(): - unique_labels = np.unique(labels) - indices = lib.groupby_indices(labels) - result = np.empty(len(unique_labels)) - - for i, label in enumerate(unique_labels): - result[i] = data.take(indices[label]).sum() - - -def algo3_nosort(): - rizer = lib.DictFactorizer() - labs, counts = rizer.factorize(labels, sort=False) - k = len(rizer.uniques) - out = np.empty(k) - lib.group_add(out, counts, data, labs) - - -def algo3_sort(): - rizer = lib.DictFactorizer() - labs, counts = rizer.factorize(labels, sort=True) - k = len(rizer.uniques) - out = np.empty(k) - lib.group_add(out, counts, data, labs) - -import numpy as np -import random - - -# dict to hold results -counts = {} - -# a hack to generate random key, value pairs. -# 5k keys, 100k values -x = np.tile(np.arange(5000, dtype='O'), 20) -random.shuffle(x) -xarr = x -x = [int(y) for y in x] -data = np.random.uniform(0, 1, 100000) - - -def f(): - # groupby sum - for k, v in zip(x, data): - try: - counts[k] += v - except KeyError: - counts[k] = v - - -def f2(): - rizer = lib.DictFactorizer() - labs, counts = rizer.factorize(xarr, sort=False) - k = len(rizer.uniques) - out = np.empty(k) - lib.group_add(out, counts, data, labs) - - -def algo4(): - rizer = lib.DictFactorizer() - labs1, _ = rizer.factorize(labels, sort=False) - k1 = len(rizer.uniques) - - rizer = lib.DictFactorizer() - labs2, _ = rizer.factorize(labels2, sort=False) - k2 = len(rizer.uniques) - - group_id = labs1 * k2 + labs2 - max_group = k1 * k2 - - if max_group > 1e6: - rizer = lib.Int64Factorizer(len(group_id)) - group_id, _ = rizer.factorize(group_id.astype('i8'), sort=True) - max_group = len(rizer.uniques) - - out = np.empty(max_group) - counts = np.zeros(max_group, dtype='i4') - lib.group_add(out, counts, data, group_id) - -# cumtime percall filename:lineno(function) -# 0.592 0.592 :1() - # 0.584 0.006 groupby_ex.py:37(algo3_nosort) - # 0.535 0.005 {method 'factorize' of DictFactorizer' objects} - # 0.047 0.000 {pandas._tseries.group_add} - # 0.002 0.000 numeric.py:65(zeros_like) - # 0.001 0.000 {method 'fill' of 'numpy.ndarray' objects} - # 0.000 0.000 {numpy.core.multiarray.empty_like} - # 0.000 0.000 {numpy.core.multiarray.empty} - -# UNIQUE timings - -# N = 10000000 -# K = 500000 - -# groups = np.array([rands(10) for _ in range(K)], dtype='O') - -# labels = np.tile(groups, N // K) -data = np.random.randn(N) - -data = np.random.randn(N) - -Ks = [100, 1000, 5000, 10000, 25000, 50000, 100000] - -# Ks = [500000, 1000000, 2500000, 5000000, 10000000] - -import psutil -import os -import gc - -pid = os.getpid() -proc = psutil.Process(pid) - - -def dict_unique(values, expected_K, sort=False, memory=False): - if memory: - gc.collect() - before_mem = proc.get_memory_info().rss - - rizer = lib.DictFactorizer() - result = rizer.unique_int64(values) - - if memory: - result = proc.get_memory_info().rss - before_mem - return result - - if sort: - result.sort() - assert(len(result) == expected_K) - return result - - -def khash_unique(values, expected_K, size_hint=False, sort=False, - memory=False): - if memory: - gc.collect() - before_mem = proc.get_memory_info().rss - - if size_hint: - rizer = lib.Factorizer(len(values)) - else: - rizer = lib.Factorizer(100) - - result = [] - result = rizer.unique(values) - - if memory: - result = proc.get_memory_info().rss - before_mem - return result - - if sort: - result.sort() - assert(len(result) == expected_K) - - -def 
khash_unique_str(values, expected_K, size_hint=False, sort=False, - memory=False): - if memory: - gc.collect() - before_mem = proc.get_memory_info().rss - - if size_hint: - rizer = lib.StringHashTable(len(values)) - else: - rizer = lib.StringHashTable(100) - - result = [] - result = rizer.unique(values) - - if memory: - result = proc.get_memory_info().rss - before_mem - return result - - if sort: - result.sort() - assert(len(result) == expected_K) - - -def khash_unique_int64(values, expected_K, size_hint=False, sort=False): - if size_hint: - rizer = lib.Int64HashTable(len(values)) - else: - rizer = lib.Int64HashTable(100) - - result = [] - result = rizer.unique(values) - - if sort: - result.sort() - assert(len(result) == expected_K) - - -def hash_bench(): - numpy = [] - dict_based = [] - dict_based_sort = [] - khash_hint = [] - khash_nohint = [] - for K in Ks: - print(K) - # groups = np.array([rands(10) for _ in range(K)]) - # labels = np.tile(groups, N // K).astype('O') - - groups = np.random.randint(0, long(100000000000), size=K) - labels = np.tile(groups, N // K) - dict_based.append(timeit(lambda: dict_unique(labels, K), 20)) - khash_nohint.append(timeit(lambda: khash_unique_int64(labels, K), 20)) - khash_hint.append(timeit(lambda: khash_unique_int64(labels, K, - size_hint=True), 20)) - - # memory, hard to get - # dict_based.append(np.mean([dict_unique(labels, K, memory=True) - # for _ in range(10)])) - # khash_nohint.append(np.mean([khash_unique(labels, K, memory=True) - # for _ in range(10)])) - # khash_hint.append(np.mean([khash_unique(labels, K, size_hint=True, memory=True) - # for _ in range(10)])) - - # dict_based_sort.append(timeit(lambda: dict_unique(labels, K, - # sort=True), 10)) - # numpy.append(timeit(lambda: np.unique(labels), 10)) - - # unique_timings = DataFrame({'numpy.unique' : numpy, - # 'dict, no sort' : dict_based, - # 'dict, sort' : dict_based_sort}, - # columns=['dict, no sort', - # 'dict, sort', 'numpy.unique'], - # index=Ks) - - unique_timings = DataFrame({'dict': dict_based, - 'khash, preallocate': khash_hint, - 'khash': khash_nohint}, - columns=['khash, preallocate', 'khash', 'dict'], - index=Ks) - - unique_timings.plot(kind='bar', legend=False) - plt.legend(loc='best') - plt.title('Unique on 100,000 values, int64') - plt.xlabel('Number of unique labels') - plt.ylabel('Mean execution time') - - plt.show() diff --git a/bench/bench_with_subset.R b/bench/bench_with_subset.R deleted file mode 100644 index 69d0f7a9eec63..0000000000000 --- a/bench/bench_with_subset.R +++ /dev/null @@ -1,53 +0,0 @@ -library(microbenchmark) -library(data.table) - - -data.frame.subset.bench <- function (n=1e7, times=30) { - df <- data.frame(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(subset(df, a <= b & b <= (c ^ 2 + b ^ 2 - a) & b > c), - times=times)) -} - - -# data.table allows something very similar to query with an expression -# but we have chained comparisons AND we're faster BOO YAH! 
-data.table.subset.expression.bench <- function (n=1e7, times=30) { - dt <- data.table(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(dt[, a <= b & b <= (c ^ 2 + b ^ 2 - a) & b > c], - times=times)) -} - - -# compare against subset with data.table for good measure -data.table.subset.bench <- function (n=1e7, times=30) { - dt <- data.table(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(subset(dt, a <= b & b <= (c ^ 2 + b ^ 2 - a) & b > c), - times=times)) -} - - -data.frame.with.bench <- function (n=1e7, times=30) { - df <- data.frame(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - - print(microbenchmark(with(df, a + b * (c ^ 2 + b ^ 2 - a) / (a * c) ^ 3), - times=times)) -} - - -data.table.with.bench <- function (n=1e7, times=30) { - dt <- data.table(a=rnorm(n), b=rnorm(n), c=rnorm(n)) - print(microbenchmark(with(dt, a + b * (c ^ 2 + b ^ 2 - a) / (a * c) ^ 3), - times=times)) -} - - -bench <- function () { - data.frame.subset.bench() - data.table.subset.expression.bench() - data.table.subset.bench() - data.frame.with.bench() - data.table.with.bench() -} - - -bench() diff --git a/bench/bench_with_subset.py b/bench/bench_with_subset.py deleted file mode 100644 index 017401df3f7f3..0000000000000 --- a/bench/bench_with_subset.py +++ /dev/null @@ -1,116 +0,0 @@ -#!/usr/bin/env python - -""" -Microbenchmarks for comparison with R's "with" and "subset" functions -""" - -from __future__ import print_function -import numpy as np -from numpy import array -from timeit import repeat as timeit -from pandas.compat import range, zip -from pandas import DataFrame - - -setup_common = """from pandas import DataFrame -from numpy.random import randn -df = DataFrame(randn(%d, 3), columns=list('abc')) -%s""" - - -setup_with = "s = 'a + b * (c ** 2 + b ** 2 - a) / (a * c) ** 3'" - - -def bench_with(n, times=10, repeat=3, engine='numexpr'): - return np.array(timeit('df.eval(s, engine=%r)' % engine, - setup=setup_common % (n, setup_with), - repeat=repeat, number=times)) / times - - -setup_subset = "s = 'a <= b <= c ** 2 + b ** 2 - a and b > c'" - - -def bench_subset(n, times=10, repeat=3, engine='numexpr'): - return np.array(timeit('df.query(s, engine=%r)' % engine, - setup=setup_common % (n, setup_subset), - repeat=repeat, number=times)) / times - - -def bench(mn=1, mx=7, num=100, engines=('python', 'numexpr'), verbose=False): - r = np.logspace(mn, mx, num=num).round().astype(int) - - ev = DataFrame(np.empty((num, len(engines))), columns=engines) - qu = ev.copy(deep=True) - - ev['size'] = qu['size'] = r - - for engine in engines: - for i, n in enumerate(r): - if verbose: - print('engine: %r, i == %d' % (engine, i)) - ev.loc[i, engine] = bench_with(n, times=1, repeat=1, engine=engine) - qu.loc[i, engine] = bench_subset(n, times=1, repeat=1, - engine=engine) - - return ev, qu - - -def plot_perf(df, engines, title, filename=None): - from matplotlib.pyplot import figure, rc - - try: - from mpltools import style - except ImportError: - pass - else: - style.use('ggplot') - - rc('text', usetex=True) - - fig = figure(figsize=(4, 3), dpi=100) - ax = fig.add_subplot(111) - - for engine in engines: - ax.plot(df.size, df[engine], label=engine, lw=2) - - ax.set_xlabel('Number of Rows') - ax.set_ylabel('Time (s)') - ax.set_title(title) - ax.legend(loc='best') - ax.tick_params(top=False, right=False) - - fig.tight_layout() - - if filename is not None: - fig.savefig(filename) - - -if __name__ == '__main__': - import os - import pandas as pd - - pandas_dir = 
os.path.dirname(os.path.abspath(os.path.dirname(__file__))) - static_path = os.path.join(pandas_dir, 'doc', 'source', '_static') - - join = lambda p: os.path.join(static_path, p) - - fn = join('eval-query-perf-data.h5') - - engines = 'python', 'numexpr' - - if not os.path.exists(fn): - ev, qu = bench(verbose=True) - ev.to_hdf(fn, 'eval') - qu.to_hdf(fn, 'query') - else: - ev = pd.read_hdf(fn, 'eval') - qu = pd.read_hdf(fn, 'query') - - plot_perf(ev, engines, 'DataFrame.eval()', filename=join('eval-perf.png')) - plot_perf(qu, engines, 'DataFrame.query()', - filename=join('query-perf.png')) - - plot_perf(ev[ev.size <= 50000], engines, 'DataFrame.eval()', - filename=join('eval-perf-small.png')) - plot_perf(qu[qu.size <= 500000], engines, 'DataFrame.query()', - filename=join('query-perf-small.png')) diff --git a/bench/better_unique.py b/bench/better_unique.py deleted file mode 100644 index e03a4f433ce66..0000000000000 --- a/bench/better_unique.py +++ /dev/null @@ -1,80 +0,0 @@ -from __future__ import print_function -from pandas import DataFrame -from pandas.compat import range, zip -import timeit - -setup = """ -from pandas import Series -import pandas._tseries as _tseries -from pandas.compat import range -import random -import numpy as np - -def better_unique(values): - uniques = _tseries.fast_unique(values) - id_map = _tseries.map_indices_buf(uniques) - labels = _tseries.get_unique_labels(values, id_map) - return uniques, labels - -tot = 100000 - -def get_test_data(ngroups=100, n=tot): - unique_groups = range(ngroups) - random.shuffle(unique_groups) - arr = np.asarray(np.tile(unique_groups, n / ngroups), dtype=object) - - if len(arr) < n: - arr = np.asarray(list(arr) + unique_groups[:n - len(arr)], - dtype=object) - - return arr - -arr = get_test_data(ngroups=%d) -""" - -group_sizes = [10, 100, 1000, 10000, - 20000, 30000, 40000, - 50000, 60000, 70000, - 80000, 90000, 100000] - -numbers = [100, 100, 50] + [10] * 10 - -numpy = [] -wes = [] - -for sz, n in zip(group_sizes, numbers): - # wes_timer = timeit.Timer(stmt='better_unique(arr)', - # setup=setup % sz) - wes_timer = timeit.Timer(stmt='_tseries.fast_unique(arr)', - setup=setup % sz) - - numpy_timer = timeit.Timer(stmt='np.unique(arr)', - setup=setup % sz) - - print(n) - numpy_result = numpy_timer.timeit(number=n) / n - wes_result = wes_timer.timeit(number=n) / n - - print('Groups: %d, NumPy: %s, Wes: %s' % (sz, numpy_result, wes_result)) - - wes.append(wes_result) - numpy.append(numpy_result) - -result = DataFrame({'wes': wes, 'numpy': numpy}, index=group_sizes) - - -def make_plot(numpy, wes): - pass - -# def get_test_data(ngroups=100, n=100000): -# unique_groups = range(ngroups) -# random.shuffle(unique_groups) -# arr = np.asarray(np.tile(unique_groups, n / ngroups), dtype=object) - -# if len(arr) < n: -# arr = np.asarray(list(arr) + unique_groups[:n - len(arr)], -# dtype=object) - -# return arr - -# arr = get_test_data(ngroups=1000) diff --git a/bench/duplicated.R b/bench/duplicated.R deleted file mode 100644 index eb2376df2932a..0000000000000 --- a/bench/duplicated.R +++ /dev/null @@ -1,22 +0,0 @@ -N <- 100000 - -k1 = rep(NA, N) -k2 = rep(NA, N) -for (i in 1:N){ - k1[i] <- paste(sample(letters, 1), collapse="") - k2[i] <- paste(sample(letters, 1), collapse="") -} -df <- data.frame(a=k1, b=k2, c=rep(1:100, N / 100)) -df2 <- data.frame(a=k1, b=k2) - -timings <- numeric() -timings2 <- numeric() -for (i in 1:50) { - gc() - timings[i] = system.time(deduped <- df[!duplicated(df),])[3] - gc() - timings2[i] = system.time(deduped <- 
df[!duplicated(df[,c("a", "b")]),])[3] -} - -mean(timings) -mean(timings2) diff --git a/bench/io_roundtrip.py b/bench/io_roundtrip.py deleted file mode 100644 index d87da0ec6321a..0000000000000 --- a/bench/io_roundtrip.py +++ /dev/null @@ -1,116 +0,0 @@ -from __future__ import print_function -import time -import os -import numpy as np - -import la -import pandas -from pandas.compat import range -from pandas import datetools, DatetimeIndex - - -def timeit(f, iterations): - start = time.clock() - - for i in range(iterations): - f() - - return time.clock() - start - - -def rountrip_archive(N, K=50, iterations=10): - # Create data - arr = np.random.randn(N, K) - # lar = la.larry(arr) - dma = pandas.DataFrame(arr, - DatetimeIndex('1/1/2000', periods=N, - offset=datetools.Minute())) - dma[201] = 'bar' - - # filenames - filename_numpy = '/Users/wesm/tmp/numpy.npz' - filename_larry = '/Users/wesm/tmp/archive.hdf5' - filename_pandas = '/Users/wesm/tmp/pandas_tmp' - - # Delete old files - try: - os.unlink(filename_numpy) - except: - pass - try: - os.unlink(filename_larry) - except: - pass - - try: - os.unlink(filename_pandas) - except: - pass - - # Time a round trip save and load - # numpy_f = lambda: numpy_roundtrip(filename_numpy, arr, arr) - # numpy_time = timeit(numpy_f, iterations) / iterations - - # larry_f = lambda: larry_roundtrip(filename_larry, lar, lar) - # larry_time = timeit(larry_f, iterations) / iterations - - pandas_f = lambda: pandas_roundtrip(filename_pandas, dma, dma) - pandas_time = timeit(pandas_f, iterations) / iterations - print('pandas (HDF5) %7.4f seconds' % pandas_time) - - pickle_f = lambda: pandas_roundtrip(filename_pandas, dma, dma) - pickle_time = timeit(pickle_f, iterations) / iterations - print('pandas (pickle) %7.4f seconds' % pickle_time) - - # print('Numpy (npz) %7.4f seconds' % numpy_time) - # print('larry (HDF5) %7.4f seconds' % larry_time) - - # Delete old files - try: - os.unlink(filename_numpy) - except: - pass - try: - os.unlink(filename_larry) - except: - pass - - try: - os.unlink(filename_pandas) - except: - pass - - -def numpy_roundtrip(filename, arr1, arr2): - np.savez(filename, arr1=arr1, arr2=arr2) - npz = np.load(filename) - arr1 = npz['arr1'] - arr2 = npz['arr2'] - - -def larry_roundtrip(filename, lar1, lar2): - io = la.IO(filename) - io['lar1'] = lar1 - io['lar2'] = lar2 - lar1 = io['lar1'] - lar2 = io['lar2'] - - -def pandas_roundtrip(filename, dma1, dma2): - # What's the best way to code this? 
- from pandas.io.pytables import HDFStore - store = HDFStore(filename) - store['dma1'] = dma1 - store['dma2'] = dma2 - dma1 = store['dma1'] - dma2 = store['dma2'] - - -def pandas_roundtrip_pickle(filename, dma1, dma2): - dma1.save(filename) - dma1 = pandas.DataFrame.load(filename) - dma2.save(filename) - dma2 = pandas.DataFrame.load(filename) - -if __name__ == '__main__': - rountrip_archive(10000, K=200) diff --git a/bench/serialize.py b/bench/serialize.py deleted file mode 100644 index b0edd6a5752d2..0000000000000 --- a/bench/serialize.py +++ /dev/null @@ -1,89 +0,0 @@ -from __future__ import print_function -from pandas.compat import range, lrange -import time -import os -import numpy as np - -import la -import pandas - - -def timeit(f, iterations): - start = time.clock() - - for i in range(iterations): - f() - - return time.clock() - start - - -def roundtrip_archive(N, iterations=10): - - # Create data - arr = np.random.randn(N, N) - lar = la.larry(arr) - dma = pandas.DataFrame(arr, lrange(N), lrange(N)) - - # filenames - filename_numpy = '/Users/wesm/tmp/numpy.npz' - filename_larry = '/Users/wesm/tmp/archive.hdf5' - filename_pandas = '/Users/wesm/tmp/pandas_tmp' - - # Delete old files - try: - os.unlink(filename_numpy) - except: - pass - try: - os.unlink(filename_larry) - except: - pass - try: - os.unlink(filename_pandas) - except: - pass - - # Time a round trip save and load - numpy_f = lambda: numpy_roundtrip(filename_numpy, arr, arr) - numpy_time = timeit(numpy_f, iterations) / iterations - - larry_f = lambda: larry_roundtrip(filename_larry, lar, lar) - larry_time = timeit(larry_f, iterations) / iterations - - pandas_f = lambda: pandas_roundtrip(filename_pandas, dma, dma) - pandas_time = timeit(pandas_f, iterations) / iterations - - print('Numpy (npz) %7.4f seconds' % numpy_time) - print('larry (HDF5) %7.4f seconds' % larry_time) - print('pandas (HDF5) %7.4f seconds' % pandas_time) - - -def numpy_roundtrip(filename, arr1, arr2): - np.savez(filename, arr1=arr1, arr2=arr2) - npz = np.load(filename) - arr1 = npz['arr1'] - arr2 = npz['arr2'] - - -def larry_roundtrip(filename, lar1, lar2): - io = la.IO(filename) - io['lar1'] = lar1 - io['lar2'] = lar2 - lar1 = io['lar1'] - lar2 = io['lar2'] - - -def pandas_roundtrip(filename, dma1, dma2): - from pandas.io.pytables import HDFStore - store = HDFStore(filename) - store['dma1'] = dma1 - store['dma2'] = dma2 - dma1 = store['dma1'] - dma2 = store['dma2'] - - -def pandas_roundtrip_pickle(filename, dma1, dma2): - dma1.save(filename) - dma1 = pandas.DataFrame.load(filename) - dma2.save(filename) - dma2 = pandas.DataFrame.load(filename) diff --git a/bench/test.py b/bench/test.py deleted file mode 100644 index 2339deab313a1..0000000000000 --- a/bench/test.py +++ /dev/null @@ -1,70 +0,0 @@ -import numpy as np -import itertools -import collections -import scipy.ndimage as ndi -from pandas.compat import zip, range - -N = 10000 - -lat = np.random.randint(0, 360, N) -lon = np.random.randint(0, 360, N) -data = np.random.randn(N) - - -def groupby1(lat, lon, data): - indexer = np.lexsort((lon, lat)) - lat = lat.take(indexer) - lon = lon.take(indexer) - sorted_data = data.take(indexer) - - keys = 1000. 
* lat + lon - unique_keys = np.unique(keys) - bounds = keys.searchsorted(unique_keys) - - result = group_agg(sorted_data, bounds, lambda x: x.mean()) - - decoder = keys.searchsorted(unique_keys) - - return dict(zip(zip(lat.take(decoder), lon.take(decoder)), result)) - - -def group_mean(lat, lon, data): - indexer = np.lexsort((lon, lat)) - lat = lat.take(indexer) - lon = lon.take(indexer) - sorted_data = data.take(indexer) - - keys = 1000 * lat + lon - unique_keys = np.unique(keys) - - result = ndi.mean(sorted_data, labels=keys, index=unique_keys) - decoder = keys.searchsorted(unique_keys) - - return dict(zip(zip(lat.take(decoder), lon.take(decoder)), result)) - - -def group_mean_naive(lat, lon, data): - grouped = collections.defaultdict(list) - for lt, ln, da in zip(lat, lon, data): - grouped[(lt, ln)].append(da) - - averaged = dict((ltln, np.mean(da)) for ltln, da in grouped.items()) - - return averaged - - -def group_agg(values, bounds, f): - N = len(values) - result = np.empty(len(bounds), dtype=float) - for i, left_bound in enumerate(bounds): - if i == len(bounds) - 1: - right_bound = N - else: - right_bound = bounds[i + 1] - - result[i] = f(values[left_bound: right_bound]) - - return result - -# for i in range(10): -# groupby1(lat, lon, data) diff --git a/bench/zoo_bench.R b/bench/zoo_bench.R deleted file mode 100644 index 294d55f51a9ab..0000000000000 --- a/bench/zoo_bench.R +++ /dev/null @@ -1,71 +0,0 @@ -library(zoo) -library(xts) -library(fts) -library(tseries) -library(its) -library(xtable) - -## indices = rep(NA, 100000) -## for (i in 1:100000) -## indices[i] <- paste(sample(letters, 10), collapse="") - - - -## x <- zoo(rnorm(100000), indices) -## y <- zoo(rnorm(90000), indices[sample(1:100000, 90000)]) - -## indices <- as.POSIXct(1:100000) - -indices <- as.POSIXct(Sys.Date()) + seq(1, 100000000, 100) - -sz <- 500000 - -## x <- xts(rnorm(sz), sample(indices, sz)) -## y <- xts(rnorm(sz), sample(indices, sz)) - -zoo.bench <- function(){ - x <- zoo(rnorm(sz), sample(indices, sz)) - y <- zoo(rnorm(sz), sample(indices, sz)) - timeit(function() {x + y}) -} - -xts.bench <- function(){ - x <- xts(rnorm(sz), sample(indices, sz)) - y <- xts(rnorm(sz), sample(indices, sz)) - timeit(function() {x + y}) -} - -fts.bench <- function(){ - x <- fts(rnorm(sz), sort(sample(indices, sz))) - y <- fts(rnorm(sz), sort(sample(indices, sz)) - timeit(function() {x + y}) -} - -its.bench <- function(){ - x <- its(rnorm(sz), sort(sample(indices, sz))) - y <- its(rnorm(sz), sort(sample(indices, sz))) - timeit(function() {x + y}) -} - -irts.bench <- function(){ - x <- irts(sort(sample(indices, sz)), rnorm(sz)) - y <- irts(sort(sample(indices, sz)), rnorm(sz)) - timeit(function() {x + y}) -} - -timeit <- function(f){ - timings <- numeric() - for (i in 1:10) { - gc() - timings[i] = system.time(f())[3] - } - mean(timings) -} - -bench <- function(){ - results <- c(xts.bench(), fts.bench(), its.bench(), zoo.bench()) - names <- c("xts", "fts", "its", "zoo") - data.frame(results, names) -} - -result <- bench() diff --git a/bench/zoo_bench.py b/bench/zoo_bench.py deleted file mode 100644 index 74cb1952a5a2a..0000000000000 --- a/bench/zoo_bench.py +++ /dev/null @@ -1,36 +0,0 @@ -from pandas import * -from pandas.util.testing import rands - -n = 1000000 -# indices = Index([rands(10) for _ in xrange(n)]) - - -def sample(values, k): - sampler = np.random.permutation(len(values)) - return values.take(sampler[:k]) -sz = 500000 -rng = np.arange(0, 10000000000000, 10000000) -stamps = np.datetime64(datetime.now()).view('i8') + 
rng -idx1 = np.sort(sample(stamps, sz)) -idx2 = np.sort(sample(stamps, sz)) -ts1 = Series(np.random.randn(sz), idx1) -ts2 = Series(np.random.randn(sz), idx2) - - -# subsample_size = 90000 - -# x = Series(np.random.randn(100000), indices) -# y = Series(np.random.randn(subsample_size), -# index=sample(indices, subsample_size)) - - -# lx = larry(np.random.randn(100000), [list(indices)]) -# ly = larry(np.random.randn(subsample_size), [list(y.index)]) - -# Benchmark 1: Two 1-million length time series (int64-based index) with -# randomly chosen timestamps - -# Benchmark 2: Join two 5-variate time series DataFrames (outer and inner join) - -# df1 = DataFrame(np.random.randn(1000000, 5), idx1, columns=range(5)) -# df2 = DataFrame(np.random.randn(1000000, 5), idx2, columns=range(5, 10)) diff --git a/ci/README.txt b/ci/README.txt deleted file mode 100644 index bb71dc25d6093..0000000000000 --- a/ci/README.txt +++ /dev/null @@ -1,17 +0,0 @@ -Travis is a ci service that's well-integrated with GitHub. -The following types of breakage should be detected -by Travis builds: - -1) Failing tests on any supported version of Python. -2) Pandas should install and the tests should run if no optional deps are installed. -That also means tests which rely on optional deps need to raise SkipTest() -if the dep is missing. -3) unicode related fails when running under exotic locales. - -We tried running the vbench suite for a while, but with varying load -on Travis machines, that wasn't useful. - -Travis currently (4/2013) has a 5-job concurrency limit. Exceeding it -basically doubles the total runtime for a commit through travis, and -since dep+pandas installation is already quite long, this should become -a hard limit on concurrent travis runs. diff --git a/ci/azure/posix.yml b/ci/azure/posix.yml new file mode 100644 index 0000000000000..b9e0cd0b9258c --- /dev/null +++ b/ci/azure/posix.yml @@ -0,0 +1,100 @@ +parameters: + name: '' + vmImage: '' + +jobs: +- job: ${{ parameters.name }} + pool: + vmImage: ${{ parameters.vmImage }} + strategy: + matrix: + ${{ if eq(parameters.name, 'macOS') }}: + py35_np_120: + ENV_FILE: ci/deps/azure-macos-35.yaml + CONDA_PY: "35" + PATTERN: "not slow and not network" + + ${{ if eq(parameters.name, 'Linux') }}: + py27_np_120: + ENV_FILE: ci/deps/azure-27-compat.yaml + CONDA_PY: "27" + PATTERN: "not slow and not network" + + py27_locale_slow_old_np: + ENV_FILE: ci/deps/azure-27-locale.yaml + CONDA_PY: "27" + PATTERN: "slow" + LOCALE_OVERRIDE: "zh_CN.UTF-8" + EXTRA_APT: "language-pack-zh-hans" + + py36_locale_slow: + ENV_FILE: ci/deps/azure-36-locale_slow.yaml + CONDA_PY: "36" + PATTERN: "not slow and not network" + LOCALE_OVERRIDE: "it_IT.UTF-8" + + py37_locale: + ENV_FILE: ci/deps/azure-37-locale.yaml + CONDA_PY: "37" + PATTERN: "not slow and not network" + LOCALE_OVERRIDE: "zh_CN.UTF-8" + + py37_np_dev: + ENV_FILE: ci/deps/azure-37-numpydev.yaml + CONDA_PY: "37" + PATTERN: "not slow and not network" + TEST_ARGS: "-W error" + PANDAS_TESTING_MODE: "deprecate" + EXTRA_APT: "xsel" + + steps: + - script: | + if [ "$(uname)" == "Linux" ]; then sudo apt-get install -y libc6-dev-i386 $EXTRA_APT; fi + echo "Installing Miniconda" + ci/incremental/install_miniconda.sh + export PATH=$HOME/miniconda3/bin:$PATH + echo "Setting up Conda environment" + ci/incremental/setup_conda_environment.sh + displayName: 'Before Install' + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/incremental/build.sh + displayName: 'Build' + - script: | + export 
PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev + ci/run_tests.sh + displayName: 'Test' + - script: | + export PATH=$HOME/miniconda3/bin:$PATH + source activate pandas-dev && pushd /tmp && python -c "import pandas; pandas.show_versions();" && popd + - task: PublishTestResults@2 + inputs: + testResultsFiles: 'test-data-*.xml' + testRunTitle: ${{ format('{0}-$(CONDA_PY)', parameters.name) }} + - powershell: | + $junitXml = "test-data-single.xml" + $(Get-Content $junitXml | Out-String) -match 'failures="(.*?)"' + if ($matches[1] -eq 0) + { + Write-Host "No test failures in test-data-single" + } + else + { + # note that this will produce $LASTEXITCODE=1 + Write-Error "$($matches[1]) tests failed" + } + + $junitXmlMulti = "test-data-multiple.xml" + $(Get-Content $junitXmlMulti | Out-String) -match 'failures="(.*?)"' + if ($matches[1] -eq 0) + { + Write-Host "No test failures in test-data-multi" + } + else + { + # note that this will produce $LASTEXITCODE=1 + Write-Error "$($matches[1]) tests failed" + } + displayName: Check for test failures diff --git a/ci/azure/windows.yml b/ci/azure/windows.yml new file mode 100644 index 0000000000000..cece002024936 --- /dev/null +++ b/ci/azure/windows.yml @@ -0,0 +1,59 @@ +parameters: + name: '' + vmImage: '' + +jobs: +- job: ${{ parameters.name }} + pool: + vmImage: ${{ parameters.vmImage }} + strategy: + matrix: + py36_np14: + ENV_FILE: ci/deps/azure-windows-36.yaml + CONDA_PY: "36" + + py27_np121: + ENV_FILE: ci/deps/azure-windows-27.yaml + CONDA_PY: "27" + + steps: + - task: CondaEnvironment@1 + inputs: + updateConda: no + packageSpecs: '' + + - powershell: | + $wc = New-Object net.webclient + $wc.Downloadfile("https://download.microsoft.com/download/7/9/6/796EF2E4-801B-4FC4-AB28-B59FBF6D907B/VCForPython27.msi", "VCForPython27.msi") + Start-Process "VCForPython27.msi" /qn -Wait + displayName: 'Install VC 9.0 only for Python 2.7' + condition: eq(variables.CONDA_PY, '27') + + - script: | + ci\\incremental\\setup_conda_environment.cmd + displayName: 'Before Install' + - script: | + call activate pandas-dev + ci\\incremental\\build.cmd + displayName: 'Build' + - script: | + call activate pandas-dev + pytest -m "not slow and not network" --junitxml=test-data.xml pandas -n 2 -r sxX --strict --durations=10 %* + displayName: 'Test' + - task: PublishTestResults@2 + inputs: + testResultsFiles: 'test-data.xml' + testRunTitle: 'Windows-$(CONDA_PY)' + - powershell: | + $junitXml = "test-data.xml" + $(Get-Content $junitXml | Out-String) -match 'failures="(.*?)"' + if ($matches[1] -eq 0) + { + Write-Host "No test failures in test-data" + } + else + { + # note that this will produce $LASTEXITCODE=1 + Write-Error "$($matches[1]) tests failed" + } + displayName: Check for test failures diff --git a/ci/before_install_travis.sh b/ci/before_install_travis.sh deleted file mode 100755 index f90427f97d3b7..0000000000000 --- a/ci/before_install_travis.sh +++ /dev/null @@ -1,15 +0,0 @@ -#!/bin/bash - -# If envars.sh determined we're running in an authorized fork -# and the user opted in to the network cache,and that cached versions -# are available on the cache server, download and deploy the cached -# files to the local filesystem - -echo "inside $0" - -# overview -if [ "${TRAVIS_OS_NAME}" == "linux" ]; then - sh -e /etc/init.d/xvfb start -fi - -true # never fail because bad things happened here diff --git a/ci/before_script_travis.sh b/ci/before_script_travis.sh new file mode 100755 index 0000000000000..0b3939b1906a2 --- /dev/null +++ b/ci/before_script_travis.sh 
@@ -0,0 +1,11 @@ +#!/bin/bash + +echo "inside $0" + +if [ "${TRAVIS_OS_NAME}" == "linux" ]; then + sh -e /etc/init.d/xvfb start + sleep 3 +fi + +# Never fail because bad things happened here. +true diff --git a/ci/build_docs.sh b/ci/build_docs.sh index 1356d097025c9..bf22f0764144c 100755 --- a/ci/build_docs.sh +++ b/ci/build_docs.sh @@ -1,31 +1,19 @@ #!/bin/bash +set -e + if [ "${TRAVIS_OS_NAME}" != "linux" ]; then echo "not doing build_docs on non-linux" exit 0 fi -cd "$TRAVIS_BUILD_DIR" +cd "$TRAVIS_BUILD_DIR"/doc echo "inside $0" -git show --pretty="format:" --name-only HEAD~5.. --first-parent | grep -P "rst|txt|doc" - -if [ "$?" != "0" ]; then - echo "Skipping doc build, none were modified" - # nope, skip docs build - exit 0 -fi - - if [ "$DOC" ]; then echo "Will build docs" - source activate pandas - - mv "$TRAVIS_BUILD_DIR"/doc /tmp - cd /tmp/doc - echo ############################### echo # Log file for the doc build # echo ############################### @@ -37,24 +25,32 @@ if [ "$DOC" ]; then echo # Create and send docs # echo ######################## - cd /tmp/doc/build/html - git config --global user.email "pandas-docs-bot@localhost.foo" - git config --global user.name "pandas-docs-bot" - git config --global credential.helper cache - - # create the repo - git init - touch README - git add README - git commit -m "Initial commit" --allow-empty - git branch gh-pages - git checkout gh-pages - touch .nojekyll - git add --all . - git commit -m "Version" --allow-empty - git remote remove origin - git remote add origin "https://${PANDAS_GH_TOKEN}@github.com/pandas-docs/pandas-docs-travis.git" - git push origin gh-pages -f + echo "Only uploading docs when TRAVIS_PULL_REQUEST is 'false'" + echo "TRAVIS_PULL_REQUEST: ${TRAVIS_PULL_REQUEST}" + + if [ "${TRAVIS_PULL_REQUEST}" == "false" ]; then + cd build/html + git config --global user.email "pandas-docs-bot@localhost.foo" + git config --global user.name "pandas-docs-bot" + + # create the repo + git init + + touch README + git add README + git commit -m "Initial commit" --allow-empty + git branch gh-pages + git checkout gh-pages + touch .nojekyll + git add --all . + git commit -m "Version" --allow-empty + + git remote add origin "https://${PANDAS_GH_TOKEN}@github.com/pandas-dev/pandas-docs-travis.git" + git fetch origin + git remote -v + + git push origin gh-pages -f + fi fi exit 0 diff --git a/ci/code_checks.sh b/ci/code_checks.sh new file mode 100755 index 0000000000000..c4840f1e836c4 --- /dev/null +++ b/ci/code_checks.sh @@ -0,0 +1,259 @@ +#!/bin/bash +# +# Run checks related to code quality. +# +# This script is intended for both the CI and to check locally that code standards are +# respected. We are currently linting (PEP-8 and similar), looking for patterns of +# common mistakes (sphinx directives with missing blank lines, old style classes, +# unwanted imports...), we run doctests here (currently some files only), and we +# validate formatting error in docstrings. 
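# Illustration (not part of the patch; a minimal sketch of the two output modes this
# script supports): the AZURE environment variable, checked further down, switches
# grep/flake8 output into Azure Pipelines "##vso[task.logissue ...]" annotations.
# Whether the pipeline YAML elsewhere in this diff actually exports AZURE=true is an
# assumption here, not something shown in this file.
#
#   ./ci/code_checks.sh patterns               # plain output, e.g. for a local run
#   AZURE=true ./ci/code_checks.sh patterns    # CI-style ##vso error annotations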
+# +# Usage: +# $ ./ci/code_checks.sh # run all checks +# $ ./ci/code_checks.sh lint # run linting only +# $ ./ci/code_checks.sh patterns # check for patterns that should not exist +# $ ./ci/code_checks.sh code # checks on imported code +# $ ./ci/code_checks.sh doctests # run doctests +# $ ./ci/code_checks.sh docstrings # validate docstring errors +# $ ./ci/code_checks.sh dependencies # check that dependencies are consistent + +[[ -z "$1" || "$1" == "lint" || "$1" == "patterns" || "$1" == "code" || "$1" == "doctests" || "$1" == "docstrings" || "$1" == "dependencies" ]] || \ + { echo "Unknown command $1. Usage: $0 [lint|patterns|code|doctests|docstrings|dependencies]"; exit 9999; } + +BASE_DIR="$(dirname $0)/.." +RET=0 +CHECK=$1 + +function invgrep { + # grep with inverse exist status and formatting for azure-pipelines + # + # This function works exactly as grep, but with opposite exit status: + # - 0 (success) when no patterns are found + # - 1 (fail) when the patterns are found + # + # This is useful for the CI, as we want to fail if one of the patterns + # that we want to avoid is found by grep. + if [[ "$AZURE" == "true" ]]; then + set -o pipefail + grep -n "$@" | awk -F ":" '{print "##vso[task.logissue type=error;sourcepath=" $1 ";linenumber=" $2 ";] Found unwanted pattern: " $3}' + else + grep "$@" + fi + return $((! $?)) +} + +if [[ "$AZURE" == "true" ]]; then + FLAKE8_FORMAT="##vso[task.logissue type=error;sourcepath=%(path)s;linenumber=%(row)s;columnnumber=%(col)s;code=%(code)s;]%(text)s" +else + FLAKE8_FORMAT="default" +fi + +### LINTING ### +if [[ -z "$CHECK" || "$CHECK" == "lint" ]]; then + + # `setup.cfg` contains the list of error codes that are being ignored in flake8 + + echo "flake8 --version" + flake8 --version + + # pandas/_libs/src is C code, so no need to search there. + MSG='Linting .py code' ; echo $MSG + flake8 --format="$FLAKE8_FORMAT" . + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Linting .pyx code' ; echo $MSG + flake8 --format="$FLAKE8_FORMAT" pandas --filename=*.pyx --select=E501,E302,E203,E111,E114,E221,E303,E128,E231,E126,E265,E305,E301,E127,E261,E271,E129,W291,E222,E241,E123,F403,C400,C401,C402,C403,C404,C405,C406,C407,C408,C409,C410,C411 + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Linting .pxd and .pxi.in' ; echo $MSG + flake8 --format="$FLAKE8_FORMAT" pandas/_libs --filename=*.pxi.in,*.pxd --select=E501,E302,E203,E111,E114,E221,E303,E231,E126,F403 + RET=$(($RET + $?)) ; echo $MSG "DONE" + + echo "flake8-rst --version" + flake8-rst --version + + MSG='Linting code-blocks in .rst documentation' ; echo $MSG + flake8-rst doc/source --filename=*.rst --format="$FLAKE8_FORMAT" + RET=$(($RET + $?)) ; echo $MSG "DONE" + + # Check that cython casting is of the form `obj` as opposed to ` obj`; + # it doesn't make a difference, but we want to be internally consistent. 
+ # Note: this grep pattern is (intended to be) equivalent to the python + # regex r'(?])> ' + MSG='Linting .pyx code for spacing conventions in casting' ; echo $MSG + invgrep -r -E --include '*.pyx' --include '*.pxi.in' '[a-zA-Z0-9*]> ' pandas/_libs + RET=$(($RET + $?)) ; echo $MSG "DONE" + + # readability/casting: Warnings about C casting instead of C++ casting + # runtime/int: Warnings about using C number types instead of C++ ones + # build/include_subdir: Warnings about prefacing included header files with directory + + # We don't lint all C files because we don't want to lint any that are built + # from Cython files nor do we want to lint C files that we didn't modify for + # this particular codebase (e.g. src/headers, src/klib, src/msgpack). However, + # we can lint all header files since they aren't "generated" like C files are. + MSG='Linting .c and .h' ; echo $MSG + cpplint --quiet --extensions=c,h --headers=h --recursive --filter=-readability/casting,-runtime/int,-build/include_subdir pandas/_libs/src/*.h pandas/_libs/src/parser pandas/_libs/ujson pandas/_libs/tslibs/src/datetime pandas/io/msgpack pandas/_libs/*.cpp pandas/util + RET=$(($RET + $?)) ; echo $MSG "DONE" + + echo "isort --version-number" + isort --version-number + + # Imports - Check formatting using isort see setup.cfg for settings + MSG='Check import format using isort ' ; echo $MSG + isort --recursive --check-only pandas asv_bench + RET=$(($RET + $?)) ; echo $MSG "DONE" + +fi + +### PATTERNS ### +if [[ -z "$CHECK" || "$CHECK" == "patterns" ]]; then + + # Check for imports from pandas.core.common instead of `import pandas.core.common as com` + MSG='Check for non-standard imports' ; echo $MSG + invgrep -R --include="*.py*" -E "from pandas.core.common import " pandas + # invgrep -R --include="*.py*" -E "from numpy import nan " pandas # GH#24822 not yet implemented since the offending imports have not all been removed + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for pytest warns' ; echo $MSG + invgrep -r -E --include '*.py' 'pytest\.warns' pandas/tests/ + RET=$(($RET + $?)) ; echo $MSG "DONE" + + # Check for the following code in testing: `np.testing` and `np.array_equal` + MSG='Check for invalid testing' ; echo $MSG + invgrep -r -E --include '*.py' --exclude testing.py '(numpy|np)(\.testing|\.array_equal)' pandas/tests/ + RET=$(($RET + $?)) ; echo $MSG "DONE" + + # Check for the following code in the extension array base tests: `tm.assert_frame_equal` and `tm.assert_series_equal` + MSG='Check for invalid EA testing' ; echo $MSG + invgrep -r -E --include '*.py' --exclude base.py 'tm.assert_(series|frame)_equal' pandas/tests/extension/base + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for deprecated messages without sphinx directive' ; echo $MSG + invgrep -R --include="*.py" --include="*.pyx" -E "(DEPRECATED|DEPRECATE|Deprecated)(:|,|\.)" pandas + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for old-style classes' ; echo $MSG + invgrep -R --include="*.py" -E "class\s\S*[^)]:" pandas scripts + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for backticks incorrectly rendering because of missing spaces' ; echo $MSG + invgrep -R --include="*.rst" -E "[a-zA-Z0-9]\`\`?[a-zA-Z0-9]" doc/source/ + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for incorrect sphinx directives' ; echo $MSG + invgrep -R --include="*.py" --include="*.pyx" --include="*.rst" -E "\.\. 
(autosummary|contents|currentmodule|deprecated|function|image|important|include|ipython|literalinclude|math|module|note|raw|seealso|toctree|versionadded|versionchanged|warning):[^:]" ./pandas ./doc/source + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check that the deprecated `assert_raises_regex` is not used (`pytest.raises(match=pattern)` should be used instead)' ; echo $MSG + invgrep -R --exclude=*.pyc --exclude=testing.py --exclude=test_util.py assert_raises_regex pandas + RET=$(($RET + $?)) ; echo $MSG "DONE" + + # Check for the following code in testing: `unittest.mock`, `mock.Mock()` or `mock.patch` + MSG='Check that unittest.mock is not used (pytest builtin monkeypatch fixture should be used instead)' ; echo $MSG + invgrep -r -E --include '*.py' '(unittest(\.| import )mock|mock\.Mock\(\)|mock\.patch)' pandas/tests/ + RET=$(($RET + $?)) ; echo $MSG "DONE" + + # Check that we use pytest.raises only as a context manager + # + # For any flake8-compliant code, the only way this regex gets + # matched is if there is no "with" statement preceding "pytest.raises" + MSG='Check for pytest.raises as context manager (a line starting with `pytest.raises` is invalid, needs a `with` to precede it)' ; echo $MSG + MSG='TODO: This check is currently skipped because so many files fail this. Please enable when all are corrected (xref gh-24332)' ; echo $MSG + # invgrep -R --include '*.py' -E '[[:space:]] pytest.raises' pandas/tests + # RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for wrong space after code-block directive and before colon (".. code-block ::" instead of ".. code-block::")' ; echo $MSG + invgrep -R --include="*.rst" ".. code-block ::" doc/source + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check for wrong space after ipython directive and before colon (".. ipython ::" instead of ".. ipython::")' ; echo $MSG + invgrep -R --include="*.rst" ".. ipython ::" doc/source + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Check that no file in the repo contains trailing whitespaces' ; echo $MSG + set -o pipefail + if [[ "$AZURE" == "true" ]]; then + # we exclude all c/cpp files as the c/cpp files of pandas code base are tested when Linting .c and .h files + ! grep -n '--exclude=*.'{svg,c,cpp,html} -RI "\s$" * | awk -F ":" '{print "##vso[task.logissue type=error;sourcepath=" $1 ";linenumber=" $2 ";] Trailing whitespaces found: " $3}' + else + ! grep -n '--exclude=*.'{svg,c,cpp,html} -RI "\s$" * | awk -F ":" '{print $1 ":" $2 ":Trailing whitespaces found: " $3}' + fi + RET=$(($RET + $?)) ; echo $MSG "DONE" +fi + +### CODE ### +if [[ -z "$CHECK" || "$CHECK" == "code" ]]; then + + MSG='Check import. 
No warnings, and blacklist some optional dependencies' ; echo $MSG + python -W error -c " +import sys +import pandas + +blacklist = {'bs4', 'gcsfs', 'html5lib', 'ipython', 'jinja2', 'hypothesis', + 'lxml', 'numexpr', 'openpyxl', 'py', 'pytest', 's3fs', 'scipy', + 'tables', 'xlrd', 'xlsxwriter', 'xlwt'} +mods = blacklist & set(m.split('.')[0] for m in sys.modules) +if mods: + sys.stderr.write('err: pandas should not import: {}\n'.format(', '.join(mods))) + sys.exit(len(mods)) + " + RET=$(($RET + $?)) ; echo $MSG "DONE" + +fi + +### DOCTESTS ### +if [[ -z "$CHECK" || "$CHECK" == "doctests" ]]; then + + MSG='Doctests frame.py' ; echo $MSG + pytest -q --doctest-modules pandas/core/frame.py \ + -k" -itertuples -join -reindex -reindex_axis -round" + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Doctests series.py' ; echo $MSG + pytest -q --doctest-modules pandas/core/series.py \ + -k"-nonzero -reindex -searchsorted -to_dict" + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Doctests generic.py' ; echo $MSG + pytest -q --doctest-modules pandas/core/generic.py \ + -k"-_set_axis_name -_xs -describe -droplevel -groupby -interpolate -pct_change -pipe -reindex -reindex_axis -to_json -transpose -values -xs -to_clipboard" + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Doctests top-level reshaping functions' ; echo $MSG + pytest -q --doctest-modules \ + pandas/core/reshape/concat.py \ + pandas/core/reshape/pivot.py \ + pandas/core/reshape/reshape.py \ + pandas/core/reshape/tile.py \ + -k"-crosstab -pivot_table -cut" + RET=$(($RET + $?)) ; echo $MSG "DONE" + + MSG='Doctests interval classes' ; echo $MSG + pytest --doctest-modules -v \ + pandas/core/indexes/interval.py \ + pandas/core/arrays/interval.py \ + -k"-from_arrays -from_breaks -from_intervals -from_tuples -get_loc -set_closed -to_tuples -interval_range" + RET=$(($RET + $?)) ; echo $MSG "DONE" + +fi + +### DOCSTRINGS ### +if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then + + MSG='Validate docstrings (GL06, GL07, GL09, SS04, SS05, PR03, PR04, PR05, PR10, EX04, RT04, RT05, SA05)' ; echo $MSG + $BASE_DIR/scripts/validate_docstrings.py --format=azure --errors=GL06,GL07,GL09,SS04,SS05,PR03,PR04,PR05,PR10,EX04,RT04,RT05,SA05 + RET=$(($RET + $?)) ; echo $MSG "DONE" + +fi + +### DEPENDENCIES ### +if [[ -z "$CHECK" || "$CHECK" == "dependencies" ]]; then + + MSG='Check that requirements-dev.txt has been generated from environment.yml' ; echo $MSG + $BASE_DIR/scripts/generate_pip_deps_from_conda.py --compare --azure + RET=$(($RET + $?)) ; echo $MSG "DONE" + +fi + +exit $RET diff --git a/ci/deps/azure-27-compat.yaml b/ci/deps/azure-27-compat.yaml new file mode 100644 index 0000000000000..a7784f17d1956 --- /dev/null +++ b/ci/deps/azure-27-compat.yaml @@ -0,0 +1,28 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - bottleneck=1.2.0 + - cython=0.28.2 + - jinja2=2.8 + - numexpr=2.6.1 + - numpy=1.12.0 + - openpyxl=2.5.5 + - pytables=3.4.2 + - python-dateutil=2.5.0 + - python=2.7* + - pytz=2013b + - scipy=0.18.1 + - xlrd=1.0.0 + - xlsxwriter=0.5.2 + - xlwt=0.7.5 + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - isort + - pip: + - html5lib==1.0b2 + - beautifulsoup4==4.2.1 + - hypothesis>=3.58.0 diff --git a/ci/deps/azure-27-locale.yaml b/ci/deps/azure-27-locale.yaml new file mode 100644 index 0000000000000..8636a63d02fed --- /dev/null +++ b/ci/deps/azure-27-locale.yaml @@ -0,0 +1,30 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - bottleneck=1.2.0 + - cython=0.28.2 + - lxml + - 
matplotlib=2.0.0 + - numpy=1.12.0 + - openpyxl=2.4.0 + - python-dateutil + - python-blosc + - python=2.7 + - pytz + - pytz=2013b + - scipy + - sqlalchemy=0.8.1 + - xlrd=1.0.0 + - xlsxwriter=0.5.2 + - xlwt=0.7.5 + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - hypothesis>=3.58.0 + - isort + - pip: + - html5lib==1.0b2 + - beautifulsoup4==4.2.1 diff --git a/ci/deps/azure-36-locale_slow.yaml b/ci/deps/azure-36-locale_slow.yaml new file mode 100644 index 0000000000000..3f788e5ddcf39 --- /dev/null +++ b/ci/deps/azure-36-locale_slow.yaml @@ -0,0 +1,35 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython>=0.28.2 + - gcsfs + - html5lib + - ipython + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - moto + - isort + - pip: + - hypothesis>=3.58.0 diff --git a/ci/deps/azure-37-locale.yaml b/ci/deps/azure-37-locale.yaml new file mode 100644 index 0000000000000..9d598cddce91a --- /dev/null +++ b/ci/deps/azure-37-locale.yaml @@ -0,0 +1,34 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython>=0.28.2 + - html5lib + - ipython + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - pytables + - python-dateutil + - python=3.7* + - pytz + - s3fs + - scipy + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - isort + - pip: + - hypothesis>=3.58.0 + - moto # latest moto in conda-forge fails with 3.7, move to conda dependencies when this is fixed diff --git a/ci/deps/azure-37-numpydev.yaml b/ci/deps/azure-37-numpydev.yaml new file mode 100644 index 0000000000000..e58c1f599279c --- /dev/null +++ b/ci/deps/azure-37-numpydev.yaml @@ -0,0 +1,19 @@ +name: pandas-dev +channels: + - defaults +dependencies: + - python=3.7* + - pytz + - Cython>=0.28.2 + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - hypothesis>=3.58.0 + - isort + - pip: + - "git+git://github.com/dateutil/dateutil.git" + - "-f https://7933911d6844c6c53a7d-47bd50c35cd79bd838daf386af554a83.ssl.cf2.rackcdn.com" + - "--pre" + - "numpy" + - "scipy" diff --git a/ci/deps/azure-macos-35.yaml b/ci/deps/azure-macos-35.yaml new file mode 100644 index 0000000000000..2326e8092cc85 --- /dev/null +++ b/ci/deps/azure-macos-35.yaml @@ -0,0 +1,31 @@ +name: pandas-dev +channels: + - defaults +dependencies: + - beautifulsoup4 + - bottleneck + - cython>=0.28.2 + - html5lib + - jinja2 + - lxml + - matplotlib=2.2.0 + - nomkl + - numexpr + - numpy=1.12.0 + - openpyxl=2.5.5 + - pyarrow + - pytables + - python=3.5* + - pytz + - xarray + - xlrd + - xlsxwriter + - xlwt + - isort + - pip: + - python-dateutil==2.5.3 + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - hypothesis>=3.58.0 diff --git a/ci/deps/azure-windows-27.yaml b/ci/deps/azure-windows-27.yaml new file mode 100644 index 0000000000000..f40efdfca3cbd --- /dev/null +++ b/ci/deps/azure-windows-27.yaml @@ -0,0 +1,33 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - bottleneck + - dateutil + - gcsfs + - html5lib + - jinja2=2.8 + - lxml + - matplotlib=2.0.1 + - numexpr + - numpy=1.12* + - openpyxl + - pytables + - python=2.7.* + - pytz + - s3fs + - scipy + - sqlalchemy + - xlrd + - xlsxwriter + - xlwt + # universal + - 
cython>=0.28.2 + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - moto + - hypothesis>=3.58.0 + - isort diff --git a/ci/deps/azure-windows-36.yaml b/ci/deps/azure-windows-36.yaml new file mode 100644 index 0000000000000..8517d340f2ba8 --- /dev/null +++ b/ci/deps/azure-windows-36.yaml @@ -0,0 +1,30 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - blosc + - bottleneck + - boost-cpp<1.67 + - fastparquet>=0.2.1 + - matplotlib + - numexpr + - numpy=1.14* + - openpyxl + - parquet-cpp + - pyarrow + - pytables + - python-dateutil + - python=3.6.6 + - pytz + - scipy + - xlrd + - xlsxwriter + - xlwt + # universal + - cython>=0.28.2 + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - hypothesis>=3.58.0 + - isort diff --git a/ci/deps/travis-27.yaml b/ci/deps/travis-27.yaml new file mode 100644 index 0000000000000..a910af36a6b10 --- /dev/null +++ b/ci/deps/travis-27.yaml @@ -0,0 +1,51 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - bottleneck + - cython=0.28.2 + - fastparquet>=0.2.1 + - gcsfs + - html5lib + - ipython + - jemalloc=4.5.0.post + - jinja2=2.8 + - lxml + - matplotlib=2.2.2 + - mock + - nomkl + - numexpr + - numpy=1.13* + - openpyxl=2.4.0 + - patsy + - psycopg2 + - py + - pyarrow=0.9.0 + - PyCrypto + - pymysql=0.6.3 + - pytables + - blosc=1.14.3 + - python-blosc + - python-dateutil=2.5.0 + - python=2.7* + - pytz=2013b + - s3fs + - scipy + - sqlalchemy=0.9.6 + - xarray=0.9.6 + - xlrd=1.0.0 + - xlsxwriter=0.5.2 + - xlwt=0.7.5 + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - moto==1.3.4 + - hypothesis>=3.58.0 + - isort + - pip: + - backports.lzma + - pandas-gbq + - pathlib diff --git a/ci/deps/travis-36-doc.yaml b/ci/deps/travis-36-doc.yaml new file mode 100644 index 0000000000000..6f33bc58a8b21 --- /dev/null +++ b/ci/deps/travis-36-doc.yaml @@ -0,0 +1,46 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - bottleneck + - cython>=0.28.2 + - fastparquet>=0.2.1 + - gitpython + - html5lib + - hypothesis>=3.58.0 + - ipykernel + - ipython + - ipywidgets + - lxml + - matplotlib + - nbconvert + - nbformat + - nbsphinx + - notebook + - numexpr + - numpy=1.13* + - numpydoc + - openpyxl + - pandoc + - pyarrow + - pyqt + - pytables + - python-dateutil + - python-snappy + - python=3.6* + - pytz + - scipy + - seaborn + - sphinx + - sqlalchemy + - statsmodels + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest>=4.0.2 + - pytest-xdist + - isort diff --git a/ci/deps/travis-36-locale.yaml b/ci/deps/travis-36-locale.yaml new file mode 100644 index 0000000000000..34b289e6c0c2f --- /dev/null +++ b/ci/deps/travis-36-locale.yaml @@ -0,0 +1,37 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython>=0.28.2 + - html5lib + - ipython + - jinja2 + - lxml + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - psycopg2 + - pymysql + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - sqlalchemy + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - moto + - isort + - pip: + - hypothesis>=3.58.0 diff --git a/ci/deps/travis-36-slow.yaml b/ci/deps/travis-36-slow.yaml new file mode 100644 index 0000000000000..46875d59411d9 --- /dev/null +++ b/ci/deps/travis-36-slow.yaml @@ -0,0 +1,33 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - cython>=0.28.2 + - html5lib + - lxml 
+ - matplotlib + - numexpr + - numpy + - openpyxl + - patsy + - psycopg2 + - pymysql + - pytables + - python-dateutil + - python=3.6* + - pytz + - s3fs + - scipy + - sqlalchemy + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - moto + - hypothesis>=3.58.0 + - isort diff --git a/ci/deps/travis-36.yaml b/ci/deps/travis-36.yaml new file mode 100644 index 0000000000000..06fc0d76a3d16 --- /dev/null +++ b/ci/deps/travis-36.yaml @@ -0,0 +1,47 @@ +name: pandas-dev +channels: + - defaults + - conda-forge +dependencies: + - beautifulsoup4 + - botocore>=1.11 + - cython>=0.28.2 + - dask + - fastparquet>=0.2.1 + - gcsfs + - geopandas + - html5lib + - matplotlib + - nomkl + - numexpr + - numpy + - openpyxl + - psycopg2 + - pyarrow=0.9.0 + - pymysql + - pytables + - python-snappy + - python=3.6.6 + - pytz + - s3fs + - scikit-learn + - scipy + - sqlalchemy + - statsmodels + - xarray + - xlrd + - xlsxwriter + - xlwt + # universal + - pytest>=4.0.2 + - pytest-xdist + - pytest-cov + - pytest-mock + - hypothesis>=3.58.0 + - isort + - pip: + - brotlipy + - coverage + - moto + - pandas-datareader + - python-dateutil diff --git a/ci/deps/travis-37.yaml b/ci/deps/travis-37.yaml new file mode 100644 index 0000000000000..f71d29fe13378 --- /dev/null +++ b/ci/deps/travis-37.yaml @@ -0,0 +1,22 @@ +name: pandas-dev +channels: + - defaults + - conda-forge + - c3i_test +dependencies: + - python=3.7 + - botocore>=1.11 + - cython>=0.28.2 + - numpy + - python-dateutil + - nomkl + - pyarrow + - pytz + - pytest>=4.0.2 + - pytest-xdist + - pytest-mock + - hypothesis>=3.58.0 + - s3fs + - isort + - pip: + - moto diff --git a/ci/incremental/build.cmd b/ci/incremental/build.cmd new file mode 100644 index 0000000000000..2cce38c03f406 --- /dev/null +++ b/ci/incremental/build.cmd @@ -0,0 +1,9 @@ +@rem https://github.com/numba/numba/blob/master/buildscripts/incremental/build.cmd + +@rem Build numba extensions without silencing compile errors +python setup.py build_ext -q --inplace + +@rem Install pandas locally +python -m pip install -e . + +if %errorlevel% neq 0 exit /b %errorlevel% diff --git a/ci/incremental/build.sh b/ci/incremental/build.sh new file mode 100755 index 0000000000000..05648037935a3 --- /dev/null +++ b/ci/incremental/build.sh @@ -0,0 +1,16 @@ +#!/bin/bash + +# Make sure any error below is reported as such +set -v -e + +echo "[building extensions]" +python setup.py build_ext -q --inplace +python -m pip install -e . 
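+# The editable install above ("pip install -e .") means the environment imports
+# pandas directly from this checkout, so the extensions just built in place are
+# the ones the CI jobs exercise.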
+ +echo +echo "[show environment]" +conda list + +echo +echo "[done]" +exit 0 diff --git a/ci/incremental/install_miniconda.sh b/ci/incremental/install_miniconda.sh new file mode 100755 index 0000000000000..a47dfdb324b34 --- /dev/null +++ b/ci/incremental/install_miniconda.sh @@ -0,0 +1,19 @@ +#!/bin/bash + +set -v -e + +# Install Miniconda +unamestr=`uname` +if [[ "$unamestr" == 'Linux' ]]; then + if [[ "$BITS32" == "yes" ]]; then + wget -q https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86.sh -O miniconda.sh + else + wget -q https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh -O miniconda.sh + fi +elif [[ "$unamestr" == 'Darwin' ]]; then + wget -q https://repo.continuum.io/miniconda/Miniconda3-latest-MacOSX-x86_64.sh -O miniconda.sh +else + echo Error +fi +chmod +x miniconda.sh +./miniconda.sh -b diff --git a/ci/incremental/setup_conda_environment.cmd b/ci/incremental/setup_conda_environment.cmd new file mode 100644 index 0000000000000..c104d78591384 --- /dev/null +++ b/ci/incremental/setup_conda_environment.cmd @@ -0,0 +1,21 @@ +@rem https://github.com/numba/numba/blob/master/buildscripts/incremental/setup_conda_environment.cmd +@rem The cmd /C hack circumvents a regression where conda installs a conda.bat +@rem script in non-root environments. +set CONDA_INSTALL=cmd /C conda install -q -y +set PIP_INSTALL=pip install -q + +@echo on + +@rem Deactivate any environment +call deactivate +@rem Display root environment (for debugging) +conda list +@rem Clean up any left-over from a previous build +conda remove --all -q -y -n pandas-dev +@rem Scipy, CFFI, jinja2 and IPython are optional dependencies, but exercised in the test suite +conda env create --file=ci\deps\azure-windows-%CONDA_PY%.yaml + +call activate pandas-dev +conda list + +if %errorlevel% neq 0 exit /b %errorlevel% diff --git a/ci/incremental/setup_conda_environment.sh b/ci/incremental/setup_conda_environment.sh new file mode 100755 index 0000000000000..f174c17a614d8 --- /dev/null +++ b/ci/incremental/setup_conda_environment.sh @@ -0,0 +1,52 @@ +#!/bin/bash + +set -v -e + +CONDA_INSTALL="conda install -q -y" +PIP_INSTALL="pip install -q" + + +# Deactivate any environment +source deactivate +# Display root environment (for debugging) +conda list +# Clean up any left-over from a previous build +# (note workaround for https://github.com/conda/conda/issues/2679: +# `conda env remove` issue) +conda remove --all -q -y -n pandas-dev + +echo +echo "[create env]" +time conda env create -q --file="${ENV_FILE}" || exit 1 + +set +v +source activate pandas-dev +set -v + +# remove any installed pandas package +# w/o removing anything else +echo +echo "[removing installed pandas]" +conda remove pandas -y --force || true +pip uninstall -y pandas || true + +echo +echo "[no installed pandas]" +conda list pandas + +if [ -n "$LOCALE_OVERRIDE" ]; then + sudo locale-gen "$LOCALE_OVERRIDE" +fi + +# # Install the compiler toolchain +# if [[ $(uname) == Linux ]]; then +# if [[ "$CONDA_SUBDIR" == "linux-32" || "$BITS32" == "yes" ]] ; then +# $CONDA_INSTALL gcc_linux-32 gxx_linux-32 +# else +# $CONDA_INSTALL gcc_linux-64 gxx_linux-64 +# fi +# elif [[ $(uname) == Darwin ]]; then +# $CONDA_INSTALL clang_osx-64 clangxx_osx-64 +# # Install llvm-openmp and intel-openmp on OSX too +# $CONDA_INSTALL llvm-openmp intel-openmp +# fi diff --git a/ci/install.ps1 b/ci/install.ps1 deleted file mode 100644 index 64ec7f81884cd..0000000000000 --- a/ci/install.ps1 +++ /dev/null @@ -1,92 +0,0 @@ -# Sample script to install Miniconda under 
Windows -# Authors: Olivier Grisel, Jonathan Helmus and Kyle Kastner, Robert McGibbon -# License: CC0 1.0 Universal: http://creativecommons.org/publicdomain/zero/1.0/ - -$MINICONDA_URL = "http://repo.continuum.io/miniconda/" - - -function DownloadMiniconda ($python_version, $platform_suffix) { - $webclient = New-Object System.Net.WebClient - $filename = "Miniconda3-latest-Windows-" + $platform_suffix + ".exe" - $url = $MINICONDA_URL + $filename - - $basedir = $pwd.Path + "\" - $filepath = $basedir + $filename - if (Test-Path $filename) { - Write-Host "Reusing" $filepath - return $filepath - } - - # Download and retry up to 3 times in case of network transient errors. - Write-Host "Downloading" $filename "from" $url - $retry_attempts = 2 - for($i=0; $i -lt $retry_attempts; $i++){ - try { - $webclient.DownloadFile($url, $filepath) - break - } - Catch [Exception]{ - Start-Sleep 1 - } - } - if (Test-Path $filepath) { - Write-Host "File saved at" $filepath - } else { - # Retry once to get the error message if any at the last try - $webclient.DownloadFile($url, $filepath) - } - return $filepath -} - - -function InstallMiniconda ($python_version, $architecture, $python_home) { - Write-Host "Installing Python" $python_version "for" $architecture "bit architecture to" $python_home - if (Test-Path $python_home) { - Write-Host $python_home "already exists, skipping." - return $false - } - if ($architecture -match "32") { - $platform_suffix = "x86" - } else { - $platform_suffix = "x86_64" - } - - $filepath = DownloadMiniconda $python_version $platform_suffix - Write-Host "Installing" $filepath "to" $python_home - $install_log = $python_home + ".log" - $args = "/S /D=$python_home" - Write-Host $filepath $args - Start-Process -FilePath $filepath -ArgumentList $args -Wait -Passthru - if (Test-Path $python_home) { - Write-Host "Python $python_version ($architecture) installation complete" - } else { - Write-Host "Failed to install Python in $python_home" - Get-Content -Path $install_log - Exit 1 - } -} - - -function InstallCondaPackages ($python_home, $spec) { - $conda_path = $python_home + "\Scripts\conda.exe" - $args = "install --yes " + $spec - Write-Host ("conda " + $args) - Start-Process -FilePath "$conda_path" -ArgumentList $args -Wait -Passthru -} - -function UpdateConda ($python_home) { - $conda_path = $python_home + "\Scripts\conda.exe" - Write-Host "Updating conda..." 
- $args = "update --yes conda" - Write-Host $conda_path $args - Start-Process -FilePath "$conda_path" -ArgumentList $args -Wait -Passthru -} - - -function main () { - InstallMiniconda "3.5" $env:PYTHON_ARCH $env:CONDA_ROOT - UpdateConda $env:CONDA_ROOT - InstallCondaPackages $env:CONDA_ROOT "conda-build jinja2 anaconda-client" -} - -main diff --git a/ci/install_circle.sh b/ci/install_circle.sh deleted file mode 100755 index 00e14b10ebbd6..0000000000000 --- a/ci/install_circle.sh +++ /dev/null @@ -1,85 +0,0 @@ -#!/usr/bin/env bash - -home_dir=$(pwd) -echo "[home_dir: $home_dir]" - -echo "[ls -ltr]" -ls -ltr - -echo "[Using clean Miniconda install]" -rm -rf "$MINICONDA_DIR" - -# install miniconda -wget http://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh -q -O miniconda.sh || exit 1 -bash miniconda.sh -b -p "$MINICONDA_DIR" || exit 1 - -export PATH="$MINICONDA_DIR/bin:$PATH" - -echo "[update conda]" -conda config --set ssl_verify false || exit 1 -conda config --set always_yes true --set changeps1 false || exit 1 -conda update -q conda - -# add the pandas channel to take priority -# to add extra packages -echo "[add channels]" -conda config --add channels pandas || exit 1 -conda config --remove channels defaults || exit 1 -conda config --add channels defaults || exit 1 - -# Useful for debugging any issues with conda -conda info -a || exit 1 - -# support env variables passed -export ENVS_FILE=".envs" - -# make sure that the .envs file exists. it is ok if it is empty -touch $ENVS_FILE - -# assume all command line arguments are environmental variables -for var in "$@" -do - echo "export $var" >> $ENVS_FILE -done - -echo "[environmental variable file]" -cat $ENVS_FILE -source $ENVS_FILE - -export REQ_BUILD=ci/requirements-${JOB}.build -export REQ_RUN=ci/requirements-${JOB}.run -export REQ_PIP=ci/requirements-${JOB}.pip - -# edit the locale override if needed -if [ -n "$LOCALE_OVERRIDE" ]; then - echo "[Adding locale to the first line of pandas/__init__.py]" - rm -f pandas/__init__.pyc - sedc="3iimport locale\nlocale.setlocale(locale.LC_ALL, '$LOCALE_OVERRIDE')\n" - sed -i "$sedc" pandas/__init__.py - echo "[head -4 pandas/__init__.py]" - head -4 pandas/__init__.py - echo -fi - -# create envbuild deps -echo "[create env: ${REQ_BUILD}]" -time conda create -n pandas -q --file=${REQ_BUILD} || exit 1 -time conda install -n pandas pytest || exit 1 - -source activate pandas - -# build but don't install -echo "[build em]" -time python setup.py build_ext --inplace || exit 1 - -# we may have run installations -echo "[conda installs: ${REQ_RUN}]" -if [ -e ${REQ_RUN} ]; then - time conda install -q --file=${REQ_RUN} || exit 1 -fi - -# we may have additional pip installs -echo "[pip installs: ${REQ_PIP}]" -if [ -e ${REQ_PIP} ]; then - pip install -r $REQ_PIP -fi diff --git a/ci/install_db_circle.sh b/ci/install_db_circle.sh deleted file mode 100755 index a00f74f009f54..0000000000000 --- a/ci/install_db_circle.sh +++ /dev/null @@ -1,8 +0,0 @@ -#!/bin/bash - -echo "installing dbs" -mysql -e 'create database pandas_nosetest;' -psql -c 'create database pandas_nosetest;' -U postgres - -echo "done" -exit 0 diff --git a/ci/install_travis.sh b/ci/install_travis.sh index f71df979c9df0..d1a940f119228 100755 --- a/ci/install_travis.sh +++ b/ci/install_travis.sh @@ -34,9 +34,9 @@ fi # install miniconda if [ "${TRAVIS_OS_NAME}" == "osx" ]; then - time wget http://repo.continuum.io/miniconda/Miniconda3-latest-MacOSX-x86_64.sh -O miniconda.sh || exit 1 + time wget 
http://repo.continuum.io/miniconda/Miniconda3-latest-MacOSX-x86_64.sh -q -O miniconda.sh || exit 1 else - time wget http://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh -O miniconda.sh || exit 1 + time wget http://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh -q -O miniconda.sh || exit 1 fi time bash miniconda.sh -b -p "$MINICONDA_DIR" || exit 1 @@ -47,22 +47,9 @@ which conda echo echo "[update conda]" conda config --set ssl_verify false || exit 1 -conda config --set always_yes true --set changeps1 false || exit 1 +conda config --set quiet true --set always_yes true --set changeps1 false || exit 1 conda update -q conda -echo -echo "[add channels]" -# add the pandas channel to take priority -# to add extra packages -conda config --add channels pandas || exit 1 -conda config --remove channels defaults || exit 1 -conda config --add channels defaults || exit 1 - -if [ "$CONDA_FORGE" ]; then - # add conda-forge channel as priority - conda config --add channels conda-forge || exit 1 -fi - # Useful for debugging any issues with conda conda info -a || exit 1 @@ -93,89 +80,29 @@ echo echo "[create env]" # create our environment -REQ="ci/requirements-${JOB}.build" -time conda create -n pandas --file=${REQ} || exit 1 +time conda env create -q --file="${ENV_FILE}" || exit 1 -source activate pandas +source activate pandas-dev -# may have addtl installation instructions for this build +# remove any installed pandas package +# w/o removing anything else echo -echo "[build addtl installs]" -REQ="ci/requirements-${JOB}.build.sh" -if [ -e ${REQ} ]; then - time bash $REQ || exit 1 -fi - -time conda install -n pandas pytest -time pip install pytest-xdist - -if [ "$LINT" ]; then - conda install flake8 - pip install cpplint -fi - -if [ "$COVERAGE" ]; then - pip install coverage pytest-cov -fi - -echo -if [ "$BUILD_TEST" ]; then - - # build & install testing - echo ["Starting installation test."] - python setup.py clean - python setup.py build_ext --inplace - python setup.py sdist --formats=gztar - conda uninstall cython - pip install dist/*tar.gz || exit 1 - -else - - # build but don't install - echo "[build em]" - time python setup.py build_ext --inplace || exit 1 - -fi +echo "[removing installed pandas]" +conda remove pandas -y --force +pip uninstall -y pandas -# we may have run installations echo -echo "[conda installs]" -REQ="ci/requirements-${JOB}.run" -if [ -e ${REQ} ]; then - time conda install -n pandas --file=${REQ} || exit 1 -fi +echo "[no installed pandas]" +conda list pandas +pip list --format columns |grep pandas -# we may have additional pip installs -echo -echo "[pip installs]" -REQ="ci/requirements-${JOB}.pip" -if [ -e ${REQ} ]; then - pip install -r $REQ -fi +# build and install +echo "[running setup.py develop]" +python setup.py develop || exit 1 -# may have addtl installation instructions for this build echo -echo "[addtl installs]" -REQ="ci/requirements-${JOB}.sh" -if [ -e ${REQ} ]; then - time bash $REQ || exit 1 -fi - -# finish install if we are not doing a build-testk -if [ -z "$BUILD_TEST" ]; then - - # remove any installed pandas package - # w/o removing anything else - echo - echo "[removing installed pandas]" - conda remove pandas --force - - # install our pandas - echo - echo "[running setup.py develop]" - python setup.py develop || exit 1 - -fi +echo "[show environment]" +conda list echo echo "[done]" diff --git a/ci/lint.sh b/ci/lint.sh deleted file mode 100755 index ed3af2568811c..0000000000000 --- a/ci/lint.sh +++ /dev/null @@ -1,68 +0,0 @@ 
-#!/bin/bash - -echo "inside $0" - -source activate pandas - -RET=0 - -if [ "$LINT" ]; then - - # pandas/_libs/src is C code, so no need to search there. - echo "Linting *.py" - flake8 pandas --filename=*.py --exclude pandas/_libs/src - if [ $? -ne "0" ]; then - RET=1 - fi - echo "Linting *.py DONE" - - echo "Linting *.pyx" - flake8 pandas --filename=*.pyx --select=E501,E302,E203,E111,E114,E221,E303,E128,E231,E126 - if [ $? -ne "0" ]; then - RET=1 - fi - echo "Linting *.pyx DONE" - - echo "Linting *.pxi.in" - for path in 'src' - do - echo "linting -> pandas/$path" - flake8 pandas/$path --filename=*.pxi.in --select=E501,E302,E203,E111,E114,E221,E303,E231,E126 - if [ $? -ne "0" ]; then - RET=1 - fi - - done - echo "Linting *.pxi.in DONE" - - # readability/casting: Warnings about C casting instead of C++ casting - # runtime/int: Warnings about using C number types instead of C++ ones - # build/include_subdir: Warnings about prefacing included header files with directory - - # We don't lint all C files because we don't want to lint any that are built - # from Cython files nor do we want to lint C files that we didn't modify for - # this particular codebase (e.g. src/headers, src/klib, src/msgpack). However, - # we can lint all header files since they aren't "generated" like C files are. - echo "Linting *.c and *.h" - for path in '*.h' 'period_helper.c' 'datetime' 'parser' 'ujson' - do - echo "linting -> pandas/_libs/src/$path" - cpplint --quiet --extensions=c,h --headers=h --filter=-readability/casting,-runtime/int,-build/include_subdir --recursive pandas/_libs/src/$path - if [ $? -ne "0" ]; then - RET=1 - fi - done - echo "Linting *.c and *.h DONE" - - echo "Check for invalid testing" - grep -r -E --include '*.py' --exclude testing.py '(numpy|np)\.testing' pandas - if [ $? 
= "0" ]; then - RET=1 - fi - echo "Check for invalid testing DONE" - -else - echo "NOT Linting" -fi - -exit $RET diff --git a/ci/print_skipped.py b/ci/print_skipped.py index dd2180f6eeb19..67bc7b556cd43 100755 --- a/ci/print_skipped.py +++ b/ci/print_skipped.py @@ -10,7 +10,7 @@ def parse_results(filename): root = tree.getroot() skipped = [] - current_class = old_class = '' + current_class = '' i = 1 assert i - 1 == len(skipped) for el in root.findall('testcase'): @@ -24,7 +24,9 @@ def parse_results(filename): out = '' if old_class != current_class: ndigits = int(math.log(i, 10) + 1) - out += ('-' * (len(name + msg) + 4 + ndigits) + '\n') # 4 for : + space + # + space + + # 4 for : + space + # + space + out += ('-' * (len(name + msg) + 4 + ndigits) + '\n') out += '#{i} {name}: {msg}'.format(i=i, name=name, msg=msg) skipped.append(out) i += 1 diff --git a/ci/print_versions.py b/ci/print_versions.py deleted file mode 100755 index 8be795174d76d..0000000000000 --- a/ci/print_versions.py +++ /dev/null @@ -1,28 +0,0 @@ -#!/usr/bin/env python - - -def show_versions(as_json=False): - import imp - import os - fn = __file__ - this_dir = os.path.dirname(fn) - pandas_dir = os.path.abspath(os.path.join(this_dir, "..")) - sv_path = os.path.join(pandas_dir, 'pandas', 'util') - mod = imp.load_module( - 'pvmod', *imp.find_module('print_versions', [sv_path])) - return mod.show_versions(as_json) - - -if __name__ == '__main__': - # optparse is 2.6-safe - from optparse import OptionParser - parser = OptionParser() - parser.add_option("-j", "--json", metavar="FILE", nargs=1, - help="Save output as JSON into file, pass in '-' to output to stdout") - - (options, args) = parser.parse_args() - - if options.json == "-": - options.json = True - - show_versions(as_json=options.json) diff --git a/ci/requirements-2.7.build b/ci/requirements-2.7.build deleted file mode 100644 index 415df13179fcf..0000000000000 --- a/ci/requirements-2.7.build +++ /dev/null @@ -1,6 +0,0 @@ -python=2.7* -python-dateutil=2.4.1 -pytz=2013b -nomkl -numpy -cython=0.23 diff --git a/ci/requirements-2.7.pip b/ci/requirements-2.7.pip deleted file mode 100644 index eb796368e7820..0000000000000 --- a/ci/requirements-2.7.pip +++ /dev/null @@ -1,8 +0,0 @@ -blosc -pandas-gbq -pathlib -backports.lzma -py -PyCrypto -mock -ipython diff --git a/ci/requirements-2.7.run b/ci/requirements-2.7.run deleted file mode 100644 index 62e31e4ae24e3..0000000000000 --- a/ci/requirements-2.7.run +++ /dev/null @@ -1,22 +0,0 @@ -python-dateutil=2.4.1 -pytz=2013b -numpy -xlwt=0.7.5 -numexpr -pytables -matplotlib -openpyxl=1.6.2 -xlrd=0.9.2 -sqlalchemy=0.9.6 -lxml=3.2.1 -scipy -xlsxwriter=0.4.6 -s3fs -bottleneck -psycopg2=2.5.2 -patsy -pymysql=0.6.3 -html5lib=1.0b2 -beautiful-soup=4.2.1 -jinja2=2.8 -xarray=0.8.0 diff --git a/ci/requirements-2.7.sh b/ci/requirements-2.7.sh deleted file mode 100644 index 64d470e5c6e0e..0000000000000 --- a/ci/requirements-2.7.sh +++ /dev/null @@ -1,7 +0,0 @@ -#!/bin/bash - -source activate pandas - -echo "install 27" - -conda install -n pandas -c conda-forge feather-format diff --git a/ci/requirements-2.7_BUILD_TEST.build b/ci/requirements-2.7_BUILD_TEST.build deleted file mode 100644 index aadec00cb7ebf..0000000000000 --- a/ci/requirements-2.7_BUILD_TEST.build +++ /dev/null @@ -1,6 +0,0 @@ -python=2.7* -dateutil -pytz -nomkl -numpy -cython diff --git a/ci/requirements-2.7_COMPAT.build b/ci/requirements-2.7_COMPAT.build deleted file mode 100644 index 0e1ccf9eac9bf..0000000000000 --- a/ci/requirements-2.7_COMPAT.build +++ /dev/null @@ -1,5 +0,0 
@@ -python=2.7* -numpy=1.7.1 -cython=0.23 -dateutil=1.5 -pytz=2013b diff --git a/ci/requirements-2.7_COMPAT.pip b/ci/requirements-2.7_COMPAT.pip deleted file mode 100644 index 9533a630d06a4..0000000000000 --- a/ci/requirements-2.7_COMPAT.pip +++ /dev/null @@ -1,2 +0,0 @@ -openpyxl -argparse diff --git a/ci/requirements-2.7_COMPAT.run b/ci/requirements-2.7_COMPAT.run deleted file mode 100644 index d27b6a72c2d15..0000000000000 --- a/ci/requirements-2.7_COMPAT.run +++ /dev/null @@ -1,16 +0,0 @@ -numpy=1.7.1 -dateutil=1.5 -pytz=2013b -scipy=0.11.0 -xlwt=0.7.5 -xlrd=0.9.2 -bottleneck=0.8.0 -numexpr=2.2.2 -pytables=3.0.0 -html5lib=1.0b2 -beautiful-soup=4.2.0 -psycopg2=2.5.1 -pymysql=0.6.0 -sqlalchemy=0.7.8 -xlsxwriter=0.4.6 -jinja2=2.8 diff --git a/ci/requirements-2.7_LOCALE.build b/ci/requirements-2.7_LOCALE.build deleted file mode 100644 index 4a37ce8fbe161..0000000000000 --- a/ci/requirements-2.7_LOCALE.build +++ /dev/null @@ -1,5 +0,0 @@ -python=2.7* -python-dateutil -pytz=2013b -numpy=1.8.2 -cython=0.23 diff --git a/ci/requirements-2.7_LOCALE.pip b/ci/requirements-2.7_LOCALE.pip deleted file mode 100644 index cf8e6b8b3d3a6..0000000000000 --- a/ci/requirements-2.7_LOCALE.pip +++ /dev/null @@ -1 +0,0 @@ -blosc diff --git a/ci/requirements-2.7_LOCALE.run b/ci/requirements-2.7_LOCALE.run deleted file mode 100644 index 5d7cc31b7d55e..0000000000000 --- a/ci/requirements-2.7_LOCALE.run +++ /dev/null @@ -1,14 +0,0 @@ -python-dateutil -pytz=2013b -numpy=1.8.2 -xlwt=0.7.5 -openpyxl=1.6.2 -xlsxwriter=0.4.6 -xlrd=0.9.2 -bottleneck=0.8.0 -matplotlib=1.3.1 -sqlalchemy=0.8.1 -html5lib=1.0b2 -lxml=3.2.1 -scipy -beautiful-soup=4.2.1 diff --git a/ci/requirements-2.7_SLOW.build b/ci/requirements-2.7_SLOW.build deleted file mode 100644 index 0f4a2c6792e6b..0000000000000 --- a/ci/requirements-2.7_SLOW.build +++ /dev/null @@ -1,5 +0,0 @@ -python=2.7* -python-dateutil -pytz -numpy=1.8.2 -cython diff --git a/ci/requirements-2.7_SLOW.run b/ci/requirements-2.7_SLOW.run deleted file mode 100644 index c2d2a14285ad6..0000000000000 --- a/ci/requirements-2.7_SLOW.run +++ /dev/null @@ -1,20 +0,0 @@ -python-dateutil -pytz -numpy=1.8.2 -matplotlib=1.3.1 -scipy -patsy -xlwt -openpyxl -xlsxwriter -xlrd -numexpr -pytables -sqlalchemy -lxml -s3fs -bottleneck -psycopg2 -pymysql -html5lib -beautiful-soup diff --git a/ci/requirements-2.7_WIN.run b/ci/requirements-2.7_WIN.run deleted file mode 100644 index f953682f52d45..0000000000000 --- a/ci/requirements-2.7_WIN.run +++ /dev/null @@ -1,18 +0,0 @@ -dateutil -pytz -numpy=1.10* -xlwt -numexpr -pytables==3.2.2 -matplotlib -openpyxl -xlrd -sqlalchemy -lxml=3.2.1 -scipy -xlsxwriter -s3fs -bottleneck -html5lib -beautiful-soup -jinja2=2.8 diff --git a/ci/requirements-3.4.build b/ci/requirements-3.4.build deleted file mode 100644 index e8a957f70d40e..0000000000000 --- a/ci/requirements-3.4.build +++ /dev/null @@ -1,4 +0,0 @@ -python=3.4* -numpy=1.8.1 -cython=0.24.1 -libgfortran=1.0 diff --git a/ci/requirements-3.4.pip b/ci/requirements-3.4.pip deleted file mode 100644 index 4e5fe52d56cf1..0000000000000 --- a/ci/requirements-3.4.pip +++ /dev/null @@ -1,2 +0,0 @@ -python-dateutil==2.2 -blosc diff --git a/ci/requirements-3.4.run b/ci/requirements-3.4.run deleted file mode 100644 index 3e12adae7dd9f..0000000000000 --- a/ci/requirements-3.4.run +++ /dev/null @@ -1,18 +0,0 @@ -pytz=2015.7 -numpy=1.8.1 -openpyxl -xlsxwriter -xlrd -xlwt -html5lib -patsy -beautiful-soup -scipy -numexpr -pytables -lxml -sqlalchemy -bottleneck -pymysql=0.6.3 -psycopg2 -jinja2=2.8 diff --git 
a/ci/requirements-3.4_SLOW.build b/ci/requirements-3.4_SLOW.build deleted file mode 100644 index 88212053af472..0000000000000 --- a/ci/requirements-3.4_SLOW.build +++ /dev/null @@ -1,6 +0,0 @@ -python=3.4* -python-dateutil -pytz -nomkl -numpy=1.10* -cython diff --git a/ci/requirements-3.4_SLOW.run b/ci/requirements-3.4_SLOW.run deleted file mode 100644 index 90156f62c6e71..0000000000000 --- a/ci/requirements-3.4_SLOW.run +++ /dev/null @@ -1,20 +0,0 @@ -python-dateutil -pytz -numpy=1.10* -openpyxl -xlsxwriter -xlrd -xlwt -html5lib -patsy -beautiful-soup -scipy -numexpr=2.4.6 -pytables -matplotlib -lxml -sqlalchemy -bottleneck -pymysql -psycopg2 -jinja2=2.8 diff --git a/ci/requirements-3.4_SLOW.sh b/ci/requirements-3.4_SLOW.sh deleted file mode 100644 index 24f1e042ed69e..0000000000000 --- a/ci/requirements-3.4_SLOW.sh +++ /dev/null @@ -1,7 +0,0 @@ -#!/bin/bash - -source activate pandas - -echo "install 34_slow" - -conda install -n pandas -c conda-forge matplotlib diff --git a/ci/requirements-3.5.build b/ci/requirements-3.5.build deleted file mode 100644 index 76227e106e1fd..0000000000000 --- a/ci/requirements-3.5.build +++ /dev/null @@ -1,6 +0,0 @@ -python=3.5* -python-dateutil -pytz -nomkl -numpy=1.11.3 -cython diff --git a/ci/requirements-3.5.pip b/ci/requirements-3.5.pip deleted file mode 100644 index 6e4f7b65f9728..0000000000000 --- a/ci/requirements-3.5.pip +++ /dev/null @@ -1,2 +0,0 @@ -xarray==0.9.1 -pandas-gbq diff --git a/ci/requirements-3.5.run b/ci/requirements-3.5.run deleted file mode 100644 index 43e6814ed6c8e..0000000000000 --- a/ci/requirements-3.5.run +++ /dev/null @@ -1,21 +0,0 @@ -python-dateutil -pytz -numpy=1.11.3 -openpyxl -xlsxwriter -xlrd -xlwt -scipy -numexpr -pytables -html5lib -lxml -matplotlib -jinja2 -bottleneck -sqlalchemy -pymysql -psycopg2 -s3fs -beautifulsoup4 -ipython diff --git a/ci/requirements-3.5.sh b/ci/requirements-3.5.sh deleted file mode 100644 index d0f0b81802dc6..0000000000000 --- a/ci/requirements-3.5.sh +++ /dev/null @@ -1,7 +0,0 @@ -#!/bin/bash - -source activate pandas - -echo "install 35" - -conda install -n pandas -c conda-forge feather-format diff --git a/ci/requirements-3.5_ASCII.build b/ci/requirements-3.5_ASCII.build deleted file mode 100644 index f7befe3b31865..0000000000000 --- a/ci/requirements-3.5_ASCII.build +++ /dev/null @@ -1,6 +0,0 @@ -python=3.5* -python-dateutil -pytz -nomkl -numpy -cython diff --git a/ci/requirements-3.5_ASCII.run b/ci/requirements-3.5_ASCII.run deleted file mode 100644 index b9d543f557d06..0000000000000 --- a/ci/requirements-3.5_ASCII.run +++ /dev/null @@ -1,3 +0,0 @@ -python-dateutil -pytz -numpy diff --git a/ci/requirements-3.5_DOC.build b/ci/requirements-3.5_DOC.build deleted file mode 100644 index 73aeb3192242f..0000000000000 --- a/ci/requirements-3.5_DOC.build +++ /dev/null @@ -1,5 +0,0 @@ -python=3.5* -python-dateutil -pytz -numpy -cython diff --git a/ci/requirements-3.5_DOC.run b/ci/requirements-3.5_DOC.run deleted file mode 100644 index 644a16f51f4b6..0000000000000 --- a/ci/requirements-3.5_DOC.run +++ /dev/null @@ -1,21 +0,0 @@ -ipython -ipykernel -sphinx -nbconvert -nbformat -notebook -matplotlib -scipy -lxml -beautifulsoup4 -html5lib -pytables -openpyxl=1.8.5 -xlrd -xlwt -xlsxwriter -sqlalchemy -numexpr -bottleneck -statsmodels -pyqt=4.11.4 diff --git a/ci/requirements-3.5_DOC.sh b/ci/requirements-3.5_DOC.sh deleted file mode 100644 index 1a5d4643edcf2..0000000000000 --- a/ci/requirements-3.5_DOC.sh +++ /dev/null @@ -1,11 +0,0 @@ -#!/bin/bash - -source activate pandas - -echo "[install DOC_BUILD 
deps]" - -pip install pandas-gbq - -conda install -n pandas -c conda-forge feather-format - -conda install -n pandas -c r r rpy2 --yes diff --git a/ci/requirements-3.5_OSX.build b/ci/requirements-3.5_OSX.build deleted file mode 100644 index f5bc01b67a20a..0000000000000 --- a/ci/requirements-3.5_OSX.build +++ /dev/null @@ -1,4 +0,0 @@ -python=3.5* -nomkl -numpy=1.10.4 -cython diff --git a/ci/requirements-3.5_OSX.pip b/ci/requirements-3.5_OSX.pip deleted file mode 100644 index d1fc1fe24a079..0000000000000 --- a/ci/requirements-3.5_OSX.pip +++ /dev/null @@ -1 +0,0 @@ -python-dateutil==2.5.3 diff --git a/ci/requirements-3.5_OSX.run b/ci/requirements-3.5_OSX.run deleted file mode 100644 index 1d83474d10f2f..0000000000000 --- a/ci/requirements-3.5_OSX.run +++ /dev/null @@ -1,16 +0,0 @@ -pytz -numpy=1.10.4 -openpyxl -xlsxwriter -xlrd -xlwt -numexpr -pytables -html5lib -lxml -matplotlib -jinja2 -bottleneck -xarray -s3fs -beautifulsoup4 diff --git a/ci/requirements-3.5_OSX.sh b/ci/requirements-3.5_OSX.sh deleted file mode 100644 index cfbd2882a8a2d..0000000000000 --- a/ci/requirements-3.5_OSX.sh +++ /dev/null @@ -1,7 +0,0 @@ -#!/bin/bash - -source activate pandas - -echo "install 35_OSX" - -conda install -n pandas -c conda-forge feather-format diff --git a/ci/requirements-3.6.build b/ci/requirements-3.6.build deleted file mode 100644 index 1c4b46aea3865..0000000000000 --- a/ci/requirements-3.6.build +++ /dev/null @@ -1,6 +0,0 @@ -python=3.6* -python-dateutil -pytz -nomkl -numpy -cython diff --git a/ci/requirements-3.6.run b/ci/requirements-3.6.run deleted file mode 100644 index 41c9680ce1b7e..0000000000000 --- a/ci/requirements-3.6.run +++ /dev/null @@ -1,22 +0,0 @@ -python-dateutil -pytz -numpy -scipy -openpyxl -xlsxwriter -xlrd -xlwt -numexpr -pytables -matplotlib -lxml -html5lib -jinja2 -sqlalchemy -pymysql -feather-format -# psycopg2 (not avail on defaults ATM) -beautifulsoup4 -s3fs -xarray -ipython diff --git a/ci/requirements-3.6_NUMPY_DEV.build b/ci/requirements-3.6_NUMPY_DEV.build deleted file mode 100644 index 738366867a217..0000000000000 --- a/ci/requirements-3.6_NUMPY_DEV.build +++ /dev/null @@ -1,4 +0,0 @@ -python=3.6* -python-dateutil -pytz -cython diff --git a/ci/requirements-3.6_NUMPY_DEV.build.sh b/ci/requirements-3.6_NUMPY_DEV.build.sh deleted file mode 100644 index 4af1307f26a18..0000000000000 --- a/ci/requirements-3.6_NUMPY_DEV.build.sh +++ /dev/null @@ -1,14 +0,0 @@ -#!/bin/bash - -source activate pandas - -echo "install numpy master wheel" - -# remove the system installed numpy -pip uninstall numpy -y - -# install numpy wheel from master -PRE_WHEELS="https://7933911d6844c6c53a7d-47bd50c35cd79bd838daf386af554a83.ssl.cf2.rackcdn.com" -pip install --pre --upgrade --timeout=60 -f $PRE_WHEELS numpy scipy - -true diff --git a/ci/requirements-3.6_NUMPY_DEV.run b/ci/requirements-3.6_NUMPY_DEV.run deleted file mode 100644 index 0aa987baefb1d..0000000000000 --- a/ci/requirements-3.6_NUMPY_DEV.run +++ /dev/null @@ -1,2 +0,0 @@ -python-dateutil -pytz diff --git a/ci/requirements-3.6_WIN.run b/ci/requirements-3.6_WIN.run deleted file mode 100644 index 840d2867e9297..0000000000000 --- a/ci/requirements-3.6_WIN.run +++ /dev/null @@ -1,13 +0,0 @@ -python-dateutil -pytz -numpy=1.12* -openpyxl -xlsxwriter -xlrd -xlwt -scipy -feather-format -numexpr -pytables -matplotlib -blosc diff --git a/ci/requirements_all.txt b/ci/requirements_all.txt deleted file mode 100644 index 4ff80a478f247..0000000000000 --- a/ci/requirements_all.txt +++ /dev/null @@ -1,26 +0,0 @@ -pytest -pytest-cov -pytest-xdist 
-flake8 -sphinx -ipython -python-dateutil -pytz -openpyxl -xlsxwriter -xlrd -xlwt -html5lib -patsy -beautiful-soup -numpy -cython -scipy -numexpr -pytables -matplotlib -lxml -sqlalchemy -bottleneck -pymysql -Jinja2 diff --git a/ci/requirements_dev.txt b/ci/requirements_dev.txt deleted file mode 100644 index 1e051802ec9f8..0000000000000 --- a/ci/requirements_dev.txt +++ /dev/null @@ -1,7 +0,0 @@ -python-dateutil -pytz -numpy -cython -pytest -pytest-cov -flake8 diff --git a/ci/run_build_docs.sh b/ci/run_build_docs.sh deleted file mode 100755 index 2909b9619552e..0000000000000 --- a/ci/run_build_docs.sh +++ /dev/null @@ -1,10 +0,0 @@ -#!/bin/bash - -echo "inside $0" - -"$TRAVIS_BUILD_DIR"/ci/build_docs.sh 2>&1 - -# wait until subprocesses finish (build_docs.sh) -wait - -exit 0 diff --git a/ci/run_circle.sh b/ci/run_circle.sh deleted file mode 100755 index 0e46d28ab6fc4..0000000000000 --- a/ci/run_circle.sh +++ /dev/null @@ -1,9 +0,0 @@ -#!/usr/bin/env bash - -echo "[running tests]" -export PATH="$MINICONDA_DIR/bin:$PATH" - -source activate pandas - -echo "pytest --junitxml=$CIRCLE_TEST_REPORTS/reports/junit.xml $@ pandas" -pytest --junitxml=$CIRCLE_TEST_REPORTS/reports/junit.xml $@ pandas diff --git a/ci/run_tests.sh b/ci/run_tests.sh new file mode 100755 index 0000000000000..ee46da9f52eab --- /dev/null +++ b/ci/run_tests.sh @@ -0,0 +1,58 @@ +#!/bin/bash + +set -e + +if [ "$DOC" ]; then + echo "We are not running pytest as this is a doc-build" + exit 0 +fi + +# Workaround for pytest-xdist flaky collection order +# https://github.com/pytest-dev/pytest/issues/920 +# https://github.com/pytest-dev/pytest/issues/1075 +export PYTHONHASHSEED=$(python -c 'import random; print(random.randint(1, 4294967295))') + +if [ -n "$LOCALE_OVERRIDE" ]; then + export LC_ALL="$LOCALE_OVERRIDE" + export LANG="$LOCALE_OVERRIDE" + PANDAS_LOCALE=`python -c 'import pandas; pandas.get_option("display.encoding")'` + if [[ "$LOCALE_OVERIDE" != "$PANDAS_LOCALE" ]]; then + echo "pandas could not detect the locale. System locale: $LOCALE_OVERRIDE, pandas detected: $PANDAS_LOCALE" + # TODO Not really aborting the tests until https://github.com/pandas-dev/pandas/issues/23923 is fixed + # exit 1 + fi +fi +if [[ "not network" == *"$PATTERN"* ]]; then + export http_proxy=http://1.2.3.4 https_proxy=http://1.2.3.4; +fi + + +if [ -n "$PATTERN" ]; then + PATTERN=" and $PATTERN" +fi + +for TYPE in single multiple +do + if [ "$COVERAGE" ]; then + COVERAGE_FNAME="/tmp/coc-$TYPE.xml" + COVERAGE="-s --cov=pandas --cov-report=xml:$COVERAGE_FNAME" + fi + + TYPE_PATTERN=$TYPE + NUM_JOBS=1 + if [[ "$TYPE_PATTERN" == "multiple" ]]; then + TYPE_PATTERN="not single" + NUM_JOBS=2 + fi + + PYTEST_CMD="pytest -m \"$TYPE_PATTERN$PATTERN\" -n $NUM_JOBS -s --strict --durations=10 --junitxml=test-data-$TYPE.xml $TEST_ARGS $COVERAGE pandas" + echo $PYTEST_CMD + # if no tests are found (the case of "single and slow"), pytest exits with code 5, and would make the script fail, if not for the below code + sh -c "$PYTEST_CMD; ret=\$?; [ \$ret = 5 ] && exit 0 || exit \$ret" + + if [[ "$COVERAGE" && $? 
== 0 ]]; then + echo "uploading coverage for $TYPE tests" + echo "bash <(curl -s https://codecov.io/bash) -Z -c -F $TYPE -f $COVERAGE_FNAME" + bash <(curl -s https://codecov.io/bash) -Z -c -F $TYPE -f $COVERAGE_FNAME + fi +done diff --git a/ci/script_multi.sh b/ci/script_multi.sh deleted file mode 100755 index 88ecaf344a410..0000000000000 --- a/ci/script_multi.sh +++ /dev/null @@ -1,36 +0,0 @@ -#!/bin/bash - -echo "[script multi]" - -source activate pandas - -if [ -n "$LOCALE_OVERRIDE" ]; then - export LC_ALL="$LOCALE_OVERRIDE"; - echo "Setting LC_ALL to $LOCALE_OVERRIDE" - - pycmd='import pandas; print("pandas detected console encoding: %s" % pandas.get_option("display.encoding"))' - python -c "$pycmd" -fi - -# Workaround for pytest-xdist flaky collection order -# https://github.com/pytest-dev/pytest/issues/920 -# https://github.com/pytest-dev/pytest/issues/1075 -export PYTHONHASHSEED=$(python -c 'import random; print(random.randint(1, 4294967295))') -echo PYTHONHASHSEED=$PYTHONHASHSEED - -if [ "$BUILD_TEST" ]; then - cd /tmp - python -c "import pandas; pandas.test(['-n 2'])" -elif [ "$DOC" ]; then - echo "We are not running pytest as this is a doc-build" -elif [ "$COVERAGE" ]; then - echo pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=/tmp/multiple.xml $TEST_ARGS pandas - pytest -s -n 2 -m "not single" --cov=pandas --cov-report xml:/tmp/cov-multiple.xml --junitxml=/tmp/multiple.xml $TEST_ARGS pandas -else - echo pytest -n 2 -m "not single" --junitxml=/tmp/multiple.xml $TEST_ARGS pandas - pytest -n 2 -m "not single" --junitxml=/tmp/multiple.xml $TEST_ARGS pandas # TODO: doctest -fi - -RET="$?" - -exit "$RET" diff --git a/ci/script_single.sh b/ci/script_single.sh deleted file mode 100755 index db637679f0e0f..0000000000000 --- a/ci/script_single.sh +++ /dev/null @@ -1,29 +0,0 @@ -#!/bin/bash - -echo "[script_single]" - -source activate pandas - -if [ -n "$LOCALE_OVERRIDE" ]; then - export LC_ALL="$LOCALE_OVERRIDE"; - echo "Setting LC_ALL to $LOCALE_OVERRIDE" - - pycmd='import pandas; print("pandas detected console encoding: %s" % pandas.get_option("display.encoding"))' - python -c "$pycmd" -fi - -if [ "$BUILD_TEST" ]; then - echo "We are not running pytest as this is a build test." -elif [ "$DOC" ]; then - echo "We are not running pytest as this is a doc-build" -elif [ "$COVERAGE" ]; then - echo pytest -s -m "single" --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=/tmp/single.xml $TEST_ARGS pandas - pytest -s -m "single" --cov=pandas --cov-report xml:/tmp/cov-single.xml --junitxml=/tmp/single.xml $TEST_ARGS pandas -else - echo pytest -m "single" --junitxml=/tmp/single.xml $TEST_ARGS pandas - pytest -m "single" --junitxml=/tmp/single.xml $TEST_ARGS pandas # TODO: doctest -fi - -RET="$?" 
- -exit "$RET" diff --git a/ci/show_circle.sh b/ci/show_circle.sh deleted file mode 100755 index bfaa65c1d84f2..0000000000000 --- a/ci/show_circle.sh +++ /dev/null @@ -1,8 +0,0 @@ -#!/usr/bin/env bash - -echo "[installed versions]" - -export PATH="$MINICONDA_DIR/bin:$PATH" -source activate pandas - -python -c "import pandas; pandas.show_versions();" diff --git a/ci/upload_coverage.sh b/ci/upload_coverage.sh deleted file mode 100755 index a7ef2fa908079..0000000000000 --- a/ci/upload_coverage.sh +++ /dev/null @@ -1,12 +0,0 @@ -#!/bin/bash - -if [ -z "$COVERAGE" ]; then - echo "coverage is not selected for this build" - exit 0 -fi - -source activate pandas - -echo "uploading coverage" -bash <(curl -s https://codecov.io/bash) -Z -c -F single -f /tmp/cov-single.xml -bash <(curl -s https://codecov.io/bash) -Z -c -F multiple -f /tmp/cov-multiple.xml diff --git a/circle.yml b/circle.yml deleted file mode 100644 index fa2da0680f388..0000000000000 --- a/circle.yml +++ /dev/null @@ -1,38 +0,0 @@ -machine: - environment: - # these are globally set - MINICONDA_DIR: /home/ubuntu/miniconda3 - - -database: - override: - - ./ci/install_db_circle.sh - - -checkout: - post: - # since circleci does a shallow fetch - # we need to populate our tags - - git fetch --depth=1000 - - -dependencies: - override: - - > - case $CIRCLE_NODE_INDEX in - 0) - sudo apt-get install language-pack-it && ./ci/install_circle.sh JOB="2.7_COMPAT" LOCALE_OVERRIDE="it_IT.UTF-8" ;; - 1) - sudo apt-get install language-pack-zh-hans && ./ci/install_circle.sh JOB="3.4_SLOW" LOCALE_OVERRIDE="zh_CN.UTF-8" ;; - 2) - sudo apt-get install language-pack-zh-hans && ./ci/install_circle.sh JOB="3.4" LOCALE_OVERRIDE="zh_CN.UTF-8" ;; - 3) - ./ci/install_circle.sh JOB="3.5_ASCII" LOCALE_OVERRIDE="C" ;; - esac - - ./ci/show_circle.sh - - -test: - override: - - case $CIRCLE_NODE_INDEX in 0) ./ci/run_circle.sh --skip-slow --skip-network ;; 1) ./ci/run_circle.sh --only-slow --skip-network ;; 2) ./ci/run_circle.sh --skip-slow --skip-network ;; 3) ./ci/run_circle.sh --skip-slow --skip-network ;; esac: - parallel: true diff --git a/codecov.yml b/codecov.yml index b4552563deeaa..512bc2e82a736 100644 --- a/codecov.yml +++ b/codecov.yml @@ -5,7 +5,9 @@ coverage: status: project: default: + enabled: no target: '82' patch: default: + enabled: no target: '50' diff --git a/conda.recipe/meta.yaml b/conda.recipe/meta.yaml index 2aee11772896f..f92090fecccf3 100644 --- a/conda.recipe/meta.yaml +++ b/conda.recipe/meta.yaml @@ -1,9 +1,9 @@ package: name: pandas - version: {{ GIT_DESCRIBE_TAG|replace("v","") }} + version: {{ environ.get('GIT_DESCRIBE_TAG','').replace('v', '', 1) }} build: - number: {{ GIT_DESCRIBE_NUMBER|int }} + number: {{ environ.get('GIT_DESCRIBE_NUMBER', 0) }} {% if GIT_DESCRIBE_NUMBER|int == 0 %}string: np{{ CONDA_NPY }}py{{ CONDA_PY }}_0 {% else %}string: np{{ CONDA_NPY }}py{{ CONDA_PY }}_{{ GIT_BUILD_STR }}{% endif %} @@ -12,22 +12,28 @@ source: requirements: build: + - {{ compiler('c') }} + - {{ compiler('cxx') }} + host: - python + - pip - cython - - numpy x.x - - setuptools + - numpy + - setuptools >=3.3 + - python-dateutil >=2.5.0 - pytz - - python-dateutil - run: - - python - - numpy x.x - - python-dateutil + - python {{ python }} + - {{ pin_compatible('numpy') }} + - python-dateutil >=2.5.0 - pytz test: - imports: - - pandas + requires: + - pytest + commands: + - python -c "import pandas; pandas.test()" + about: home: http://pandas.pydata.org diff --git a/doc/README.rst b/doc/README.rst index a3733846d9ed1..5423e7419d03b 100644 --- 
a/doc/README.rst +++ b/doc/README.rst @@ -1,169 +1 @@ -.. _contributing.docs: - -Contributing to the documentation -================================= - -If you're not the developer type, contributing to the documentation is still -of huge value. You don't even have to be an expert on -*pandas* to do so! Something as simple as rewriting small passages for clarity -as you reference the docs is a simple but effective way to contribute. The -next person to read that passage will be in your debt! - -Actually, there are sections of the docs that are worse off by being written -by experts. If something in the docs doesn't make sense to you, updating the -relevant section after you figure it out is a simple way to ensure it will -help the next person. - -.. contents:: Table of contents: - :local: - - -About the pandas documentation ------------------------------- - -The documentation is written in **reStructuredText**, which is almost like writing -in plain English, and built using `Sphinx `__. The -Sphinx Documentation has an excellent `introduction to reST -`__. Review the Sphinx docs to perform more -complex changes to the documentation as well. - -Some other important things to know about the docs: - -- The pandas documentation consists of two parts: the docstrings in the code - itself and the docs in this folder ``pandas/doc/``. - - The docstrings provide a clear explanation of the usage of the individual - functions, while the documentation in this folder consists of tutorial-like - overviews per topic together with some other information (what's new, - installation, etc). - -- The docstrings follow the **Numpy Docstring Standard** which is used widely - in the Scientific Python community. This standard specifies the format of - the different sections of the docstring. See `this document - `_ - for a detailed explanation, or look at some of the existing functions to - extend it in a similar manner. - -- The tutorials make heavy use of the `ipython directive - `_ sphinx extension. - This directive lets you put code in the documentation which will be run - during the doc build. For example: - - :: - - .. ipython:: python - - x = 2 - x**3 - - will be rendered as - - :: - - In [1]: x = 2 - - In [2]: x**3 - Out[2]: 8 - - This means that almost all code examples in the docs are always run (and the - output saved) during the doc build. This way, they will always be up to date, - but it makes the doc building a bit more complex. - - -How to build the pandas documentation -------------------------------------- - -Requirements -^^^^^^^^^^^^ - -To build the pandas docs there are some extra requirements: you will need to -have ``sphinx`` and ``ipython`` installed. `numpydoc -`_ is used to parse the docstrings that -follow the Numpy Docstring Standard (see above), but you don't need to install -this because a local copy of ``numpydoc`` is included in the pandas source -code. - -Furthermore, it is recommended to have all `optional dependencies -`_ -installed. This is not needed, but be aware that you will see some error -messages. Because all the code in the documentation is executed during the doc -build, the examples using this optional dependencies will generate errors. -Run ``pd.show_versions()`` to get an overview of the installed version of all -dependencies. - -.. warning:: - - Sphinx version >= 1.2.2 or the older 1.1.3 is required. 
- -Building pandas -^^^^^^^^^^^^^^^ - -For a step-by-step overview on how to set up your environment, to work with -the pandas code and git, see `the developer pages -`_. -When you start to work on some docs, be sure to update your code to the latest -development version ('master'):: - - git fetch upstream - git rebase upstream/master - -Often it will be necessary to rebuild the C extension after updating:: - - python setup.py build_ext --inplace - -Building the documentation -^^^^^^^^^^^^^^^^^^^^^^^^^^ - -So how do you build the docs? Navigate to your local folder -``pandas/doc/`` directory in the console and run:: - - python make.py html - -And then you can find the html output in the folder ``pandas/doc/build/html/``. - -The first time it will take quite a while, because it has to run all the code -examples in the documentation and build all generated docstring pages. -In subsequent evocations, sphinx will try to only build the pages that have -been modified. - -If you want to do a full clean build, do:: - - python make.py clean - python make.py build - - -Starting with 0.13.1 you can tell ``make.py`` to compile only a single section -of the docs, greatly reducing the turn-around time for checking your changes. -You will be prompted to delete `.rst` files that aren't required, since the -last committed version can always be restored from git. - -:: - - #omit autosummary and API section - python make.py clean - python make.py --no-api - - # compile the docs with only a single - # section, that which is in indexing.rst - python make.py clean - python make.py --single indexing - -For comparison, a full doc build may take 10 minutes. a ``-no-api`` build -may take 3 minutes and a single section may take 15 seconds. - -Where to start? ---------------- - -There are a number of issues listed under `Docs -`_ -and `Good as first PR -`_ -where you could start out. - -Or maybe you have an idea of your own, by using pandas, looking for something -in the documentation and thinking 'this can be improved', let's do something -about that! - -Feel free to ask questions on `mailing list -`_ or submit an -issue on Github. +See `contributing.rst `_ in this repo. diff --git a/doc/_templates/api_redirect.html b/doc/_templates/api_redirect.html index 24bdd8363830f..c04a8b58ce544 100644 --- a/doc/_templates/api_redirect.html +++ b/doc/_templates/api_redirect.html @@ -1,15 +1,10 @@ -{% set pgn = pagename.split('.') -%} -{% if pgn[-2][0].isupper() -%} - {% set redirect = ["pandas", pgn[-2], pgn[-1], 'html']|join('.') -%} -{% else -%} - {% set redirect = ["pandas", pgn[-1], 'html']|join('.') -%} -{% endif -%} +{% set redirect = redirects[pagename.split("/")[-1]] %} - + This API page has moved -

-    This API page has moved <a href="{{ redirect }}">here</a>.
+
+    This API page has moved <a href="{{ redirect }}">here</a>.

- \ No newline at end of file + diff --git a/doc/cheatsheet/Pandas_Cheat_Sheet.pdf b/doc/cheatsheet/Pandas_Cheat_Sheet.pdf index d504926d22580..48da05d053b96 100644 Binary files a/doc/cheatsheet/Pandas_Cheat_Sheet.pdf and b/doc/cheatsheet/Pandas_Cheat_Sheet.pdf differ diff --git a/doc/cheatsheet/Pandas_Cheat_Sheet.pptx b/doc/cheatsheet/Pandas_Cheat_Sheet.pptx index 76ae8f1e39d4e..039b3898fa301 100644 Binary files a/doc/cheatsheet/Pandas_Cheat_Sheet.pptx and b/doc/cheatsheet/Pandas_Cheat_Sheet.pptx differ diff --git a/doc/cheatsheet/Pandas_Cheat_Sheet_JA.pdf b/doc/cheatsheet/Pandas_Cheat_Sheet_JA.pdf new file mode 100644 index 0000000000000..cf1e40e627f33 Binary files /dev/null and b/doc/cheatsheet/Pandas_Cheat_Sheet_JA.pdf differ diff --git a/doc/cheatsheet/Pandas_Cheat_Sheet_JA.pptx b/doc/cheatsheet/Pandas_Cheat_Sheet_JA.pptx new file mode 100644 index 0000000000000..564d92ddbb56a Binary files /dev/null and b/doc/cheatsheet/Pandas_Cheat_Sheet_JA.pptx differ diff --git a/doc/cheatsheet/README.txt b/doc/cheatsheet/README.txt index e2f6ec042e9cc..d32fe5bcd05a6 100644 --- a/doc/cheatsheet/README.txt +++ b/doc/cheatsheet/README.txt @@ -2,3 +2,7 @@ The Pandas Cheat Sheet was created using Microsoft Powerpoint 2013. To create the PDF version, within Powerpoint, simply do a "Save As" and pick "PDF' as the format. +This cheat sheet was inspired by the RstudioData Wrangling Cheatsheet[1], written by Irv Lustig, Princeton Consultants[2]. + +[1]: https://www.rstudio.com/wp-content/uploads/2015/02/data-wrangling-cheatsheet.pdf +[2]: http://www.princetonoptimization.com/ diff --git a/doc/make.py b/doc/make.py index 30cd2ad8b61c9..6ffbd3ef86e68 100755 --- a/doc/make.py +++ b/doc/make.py @@ -1,476 +1,341 @@ #!/usr/bin/env python - """ Python script for building documentation. To build the docs you must have all optional dependencies for pandas installed. See the installation instructions for a list of these. -Note: currently latex builds do not work because of table formats that are not -supported in the latex generation. - -2014-01-30: Latex has some issues but 'latex_forced' works ok for 0.13.0-400 or so - Usage ----- -python make.py clean -python make.py html + $ python make.py clean + $ python make.py html + $ python make.py latex """ -from __future__ import print_function - -import io -import glob # noqa +import importlib +import sys import os import shutil -import sys -from contextlib import contextmanager - -import sphinx # noqa +import csv +import subprocess import argparse -import jinja2 # noqa - -os.environ['PYTHONPATH'] = '..' - -SPHINX_BUILD = 'sphinxbuild' - - -def upload_dev(user='pandas'): - 'push a copy to the pydata dev directory' - if os.system('cd build/html; rsync -avz . {0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/dev/ -essh'.format(user)): - raise SystemExit('Upload to Pydata Dev failed') - - -def upload_dev_pdf(user='pandas'): - 'push a copy to the pydata dev directory' - if os.system('cd build/latex; scp pandas.pdf {0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/dev/'.format(user)): - raise SystemExit('PDF upload to Pydata Dev failed') - - -def upload_stable(user='pandas'): - 'push a copy to the pydata stable directory' - if os.system('cd build/html; rsync -avz . 
{0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/stable/ -essh'.format(user)): - raise SystemExit('Upload to stable failed') - - -def upload_stable_pdf(user='pandas'): - 'push a copy to the pydata dev directory' - if os.system('cd build/latex; scp pandas.pdf {0}@pandas.pydata.org' - ':/usr/share/nginx/pandas/pandas-docs/stable/'.format(user)): - raise SystemExit('PDF upload to stable failed') - - -def upload_prev(ver, doc_root='./', user='pandas'): - 'push a copy of older release to appropriate version directory' - local_dir = doc_root + 'build/html' - remote_dir = '/usr/share/nginx/pandas/pandas-docs/version/%s/' % ver - cmd = 'cd %s; rsync -avz . %s@pandas.pydata.org:%s -essh' - cmd = cmd % (local_dir, user, remote_dir) - print(cmd) - if os.system(cmd): - raise SystemExit( - 'Upload to %s from %s failed' % (remote_dir, local_dir)) - - local_dir = doc_root + 'build/latex' - pdf_cmd = 'cd %s; scp pandas.pdf %s@pandas.pydata.org:%s' - pdf_cmd = pdf_cmd % (local_dir, user, remote_dir) - if os.system(pdf_cmd): - raise SystemExit('Upload PDF to %s from %s failed' % (ver, doc_root)) - -def build_pandas(): - os.chdir('..') - os.system('python setup.py clean') - os.system('python setup.py build_ext --inplace') - os.chdir('doc') - -def build_prev(ver): - if os.system('git checkout v%s' % ver) != 1: - os.chdir('..') - os.system('python setup.py clean') - os.system('python setup.py build_ext --inplace') - os.chdir('doc') - os.system('python make.py clean') - os.system('python make.py html') - os.system('python make.py latex') - os.system('git checkout master') - - -def clean(): - if os.path.exists('build'): - shutil.rmtree('build') - - if os.path.exists('source/generated'): - shutil.rmtree('source/generated') - +import webbrowser +import docutils +import docutils.parsers.rst -@contextmanager -def cleanup_nb(nb): - try: - yield - finally: - try: - os.remove(nb + '.executed') - except OSError: - pass +DOC_PATH = os.path.dirname(os.path.abspath(__file__)) +SOURCE_PATH = os.path.join(DOC_PATH, 'source') +BUILD_PATH = os.path.join(DOC_PATH, 'build') +REDIRECTS_FILE = os.path.join(DOC_PATH, 'redirects.csv') -def get_kernel(): - """Find the kernel name for your python version""" - return 'python%s' % sys.version_info.major - -def execute_nb(src, dst, allow_errors=False, timeout=1000, kernel_name=''): - """ - Execute notebook in `src` and write the output to `dst` - - Parameters - ---------- - src, dst: str - path to notebook - allow_errors: bool - timeout: int - kernel_name: str - defualts to value set in notebook metadata - - Returns - ------- - dst: str +class DocBuilder: """ - import nbformat - from nbconvert.preprocessors import ExecutePreprocessor - - with io.open(src, encoding='utf-8') as f: - nb = nbformat.read(f, as_version=4) - - ep = ExecutePreprocessor(allow_errors=allow_errors, - timeout=timeout, - kernel_name=kernel_name) - ep.preprocess(nb, resources={}) + Class to wrap the different commands of this script. - with io.open(dst, 'wt', encoding='utf-8') as f: - nbformat.write(nb, f) - return dst - - -def convert_nb(src, dst, to='html', template_file='basic'): - """ - Convert a notebook `src`. - - Parameters - ---------- - src, dst: str - filepaths - to: {'rst', 'html'} - format to export to - template_file: str - name of template file to use. Default 'basic' + All public methods of this class can be called as parameters of the + script. 
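+
+    For instance, running ``python make.py html`` (as in the module usage
+    above) is expected to call the corresponding ``html`` method on an
+    instance of this class, roughly::
+
+        builder = DocBuilder(num_jobs=2)  # illustrative sketch only
+        builder.html()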
""" - from nbconvert import HTMLExporter, RSTExporter - - dispatch = {'rst': RSTExporter, 'html': HTMLExporter} - exporter = dispatch[to.lower()](template_file=template_file) - - (body, resources) = exporter.from_filename(src) - with io.open(dst, 'wt', encoding='utf-8') as f: - f.write(body) - return dst - - -def html(): - check_build() - - notebooks = [ - 'source/html-styling.ipynb', - ] + def __init__(self, num_jobs=0, include_api=True, single_doc=None, + verbosity=0, warnings_are_errors=False): + self.num_jobs = num_jobs + self.verbosity = verbosity + self.warnings_are_errors = warnings_are_errors + + if single_doc: + single_doc = self._process_single_doc(single_doc) + include_api = False + os.environ['SPHINX_PATTERN'] = single_doc + elif not include_api: + os.environ['SPHINX_PATTERN'] = '-api' + + self.single_doc_html = None + if single_doc and single_doc.endswith('.rst'): + self.single_doc_html = os.path.splitext(single_doc)[0] + '.html' + elif single_doc: + self.single_doc_html = 'reference/api/pandas.{}.html'.format( + single_doc) + + def _process_single_doc(self, single_doc): + """ + Make sure the provided value for --single is a path to an existing + .rst/.ipynb file, or a pandas object that can be imported. + + For example, categorial.rst or pandas.DataFrame.head. For the latter, + return the corresponding file path + (e.g. reference/api/pandas.DataFrame.head.rst). + """ + base_name, extension = os.path.splitext(single_doc) + if extension in ('.rst', '.ipynb'): + if os.path.exists(os.path.join(SOURCE_PATH, single_doc)): + return single_doc + else: + raise FileNotFoundError('File {} not found'.format(single_doc)) - for nb in notebooks: - with cleanup_nb(nb): + elif single_doc.startswith('pandas.'): try: - print("Converting %s" % nb) - kernel_name = get_kernel() - executed = execute_nb(nb, nb + '.executed', allow_errors=True, - kernel_name=kernel_name) - convert_nb(executed, nb.rstrip('.ipynb') + '.html') - except (ImportError, IndexError) as e: - print(e) - print("Failed to convert %s" % nb) - - if os.system('sphinx-build -P -b html -d build/doctrees ' - 'source build/html'): - raise SystemExit("Building HTML failed.") - try: - # remove stale file - os.remove('source/html-styling.html') - os.remove('build/html/pandas.zip') - except: - pass - - -def zip_html(): - try: - print("\nZipping up HTML docs...") - # just in case the wonky build box doesn't have zip - # don't fail this. - os.system('cd build; rm -f html/pandas.zip; zip html/pandas.zip -r -q html/* ') - print("\n") - except: - pass - -def latex(): - check_build() - if sys.platform != 'win32': - # LaTeX format. - if os.system('sphinx-build -j 2 -b latex -d build/doctrees ' - 'source build/latex'): - raise SystemExit("Building LaTeX failed.") - # Produce pdf. - - os.chdir('build/latex') - - # Call the makefile produced by sphinx... - if os.system('make'): - print("Rendering LaTeX failed.") - print("You may still be able to get a usable PDF file by going into 'build/latex'") - print("and executing 'pdflatex pandas.tex' for the requisite number of passes.") - print("Or using the 'latex_forced' target") - raise SystemExit - - os.chdir('../..') - else: - print('latex build has not been tested on windows') - -def latex_forced(): - check_build() - if sys.platform != 'win32': - # LaTeX format. - if os.system('sphinx-build -j 2 -b latex -d build/doctrees ' - 'source build/latex'): - raise SystemExit("Building LaTeX failed.") - # Produce pdf. 
- - os.chdir('build/latex') - - # Manually call pdflatex, 3 passes should ensure latex fixes up - # all the required cross-references and such. - os.system('pdflatex -interaction=nonstopmode pandas.tex') - os.system('pdflatex -interaction=nonstopmode pandas.tex') - os.system('pdflatex -interaction=nonstopmode pandas.tex') - raise SystemExit("You should check the file 'build/latex/pandas.pdf' for problems.") - - os.chdir('../..') - else: - print('latex build has not been tested on windows') - - -def check_build(): - build_dirs = [ - 'build', 'build/doctrees', 'build/html', - 'build/latex', 'build/plots', 'build/_static', - 'build/_templates'] - for d in build_dirs: - try: - os.mkdir(d) - except OSError: - pass - - -def all(): - # clean() - html() - - -def auto_dev_build(debug=False): - msg = '' - try: - step = 'clean' - clean() - step = 'html' - html() - step = 'upload dev' - upload_dev() - if not debug: - sendmail(step) - - step = 'latex' - latex() - step = 'upload pdf' - upload_dev_pdf() - if not debug: - sendmail(step) - except (Exception, SystemExit) as inst: - msg = str(inst) + '\n' - sendmail(step, '[ERROR] ' + msg) - - -def sendmail(step=None, err_msg=None): - from_name, to_name = _get_config() - - if step is None: - step = '' - - if err_msg is None or '[ERROR]' not in err_msg: - msgstr = 'Daily docs %s completed successfully' % step - subject = "DOC: %s successful" % step - else: - msgstr = err_msg - subject = "DOC: %s failed" % step - - import smtplib - from email.MIMEText import MIMEText - msg = MIMEText(msgstr) - msg['Subject'] = subject - msg['From'] = from_name - msg['To'] = to_name - - server_str, port, login, pwd = _get_credentials() - server = smtplib.SMTP(server_str, port) - server.ehlo() - server.starttls() - server.ehlo() - - server.login(login, pwd) - try: - server.sendmail(from_name, to_name, msg.as_string()) - finally: - server.close() - - -def _get_dir(subdir=None): - import getpass - USERNAME = getpass.getuser() - if sys.platform == 'darwin': - HOME = '/Users/%s' % USERNAME - else: - HOME = '/home/%s' % USERNAME - - if subdir is None: - subdir = '/code/scripts/config' - conf_dir = '%s/%s' % (HOME, subdir) - return conf_dir - - -def _get_credentials(): - tmp_dir = _get_dir() - cred = '%s/credentials' % tmp_dir - with open(cred, 'r') as fh: - server, port, un, domain = fh.read().split(',') - port = int(port) - login = un + '@' + domain + '.com' - - import base64 - with open('%s/cron_email_pwd' % tmp_dir, 'r') as fh: - pwd = base64.b64decode(fh.read()) - - return server, port, login, pwd - - -def _get_config(): - tmp_dir = _get_dir() - with open('%s/addresses' % tmp_dir, 'r') as fh: - from_name, to_name = fh.read().split(',') - return from_name, to_name - -funcd = { - 'html': html, - 'zip_html': zip_html, - 'upload_dev': upload_dev, - 'upload_stable': upload_stable, - 'upload_dev_pdf': upload_dev_pdf, - 'upload_stable_pdf': upload_stable_pdf, - 'latex': latex, - 'latex_forced': latex_forced, - 'clean': clean, - 'auto_dev': auto_dev_build, - 'auto_debug': lambda: auto_dev_build(True), - 'build_pandas': build_pandas, - 'all': all, -} - -small_docs = False - -# current_dir = os.getcwd() -# os.chdir(os.path.dirname(os.path.join(current_dir, __file__))) - -import argparse -argparser = argparse.ArgumentParser(description=""" -pandas documentation builder -""".strip()) - -# argparser.add_argument('-arg_name', '--arg_name', -# metavar='label for arg help', -# type=str|etc, -# nargs='N|*|?|+|argparse.REMAINDER', -# required=False, -# #choices='abc', -# help='help string', -# 
action='store|store_true') - -# args = argparser.parse_args() - -#print args.accumulate(args.integers) - -def generate_index(api=True, single=False, **kwds): - from jinja2 import Template - with open("source/index.rst.template") as f: - t = Template(f.read()) - - with open("source/index.rst","w") as f: - f.write(t.render(api=api,single=single,**kwds)) + obj = pandas # noqa: F821 + for name in single_doc.split('.'): + obj = getattr(obj, name) + except AttributeError: + raise ImportError('Could not import {}'.format(single_doc)) + else: + return single_doc[len('pandas.'):] + else: + raise ValueError(('--single={} not understood. Value should be a ' + 'valid path to a .rst or .ipynb file, or a ' + 'valid pandas object (e.g. categorical.rst or ' + 'pandas.DataFrame.head)').format(single_doc)) + + @staticmethod + def _run_os(*args): + """ + Execute a command as a OS terminal. + + Parameters + ---------- + *args : list of str + Command and parameters to be executed + + Examples + -------- + >>> DocBuilder()._run_os('python', '--version') + """ + subprocess.check_call(args, stdout=sys.stdout, stderr=sys.stderr) + + def _sphinx_build(self, kind): + """ + Call sphinx to build documentation. + + Attribute `num_jobs` from the class is used. + + Parameters + ---------- + kind : {'html', 'latex'} + + Examples + -------- + >>> DocBuilder(num_jobs=4)._sphinx_build('html') + """ + if kind not in ('html', 'latex'): + raise ValueError('kind must be html or latex, ' + 'not {}'.format(kind)) + + cmd = ['sphinx-build', '-b', kind] + if self.num_jobs: + cmd += ['-j', str(self.num_jobs)] + if self.warnings_are_errors: + cmd += ['-W', '--keep-going'] + if self.verbosity: + cmd.append('-{}'.format('v' * self.verbosity)) + cmd += ['-d', os.path.join(BUILD_PATH, 'doctrees'), + SOURCE_PATH, os.path.join(BUILD_PATH, kind)] + return subprocess.call(cmd) + + def _open_browser(self, single_doc_html): + """ + Open a browser tab showing single + """ + url = os.path.join('file://', DOC_PATH, 'build', 'html', + single_doc_html) + webbrowser.open(url, new=2) + + def _get_page_title(self, page): + """ + Open the rst file `page` and extract its title. + """ + fname = os.path.join(SOURCE_PATH, '{}.rst'.format(page)) + option_parser = docutils.frontend.OptionParser( + components=(docutils.parsers.rst.Parser,)) + doc = docutils.utils.new_document( + '', + option_parser.get_default_values()) + with open(fname) as f: + data = f.read() + + parser = docutils.parsers.rst.Parser() + # do not generate any warning when parsing the rst + with open(os.devnull, 'a') as f: + doc.reporter.stream = f + parser.parse(data, doc) + + section = next(node for node in doc.children + if isinstance(node, docutils.nodes.section)) + title = next(node for node in section.children + if isinstance(node, docutils.nodes.title)) + + return title.astext() + + def _add_redirects(self): + """ + Create in the build directory an html file with a redirect, + for every row in REDIRECTS_FILE. + """ + html = ''' + + + + + +

+        <html>
+        <head>
+            <meta http-equiv="refresh" content="0;URL={url}"/>
+        </head>
+        <body>
+            <p>
+                The page has been moved to <a href="{url}">{title}</a>
+            </p>
+        </body>
+        </html>

+ + + ''' + with open(REDIRECTS_FILE) as mapping_fd: + reader = csv.reader(mapping_fd) + for row in reader: + if not row or row[0].strip().startswith('#'): + continue + + path = os.path.join(BUILD_PATH, + 'html', + *row[0].split('/')) + '.html' + + try: + title = self._get_page_title(row[1]) + except Exception: + # the file can be an ipynb and not an rst, or docutils + # may not be able to read the rst because it has some + # sphinx specific stuff + title = 'this page' + + if os.path.exists(path): + raise RuntimeError(( + 'Redirection would overwrite an existing file: ' + '{}').format(path)) + + with open(path, 'w') as moved_page_fd: + moved_page_fd.write( + html.format(url='{}.html'.format(row[1]), + title=title)) + + def html(self): + """ + Build HTML documentation. + """ + ret_code = self._sphinx_build('html') + zip_fname = os.path.join(BUILD_PATH, 'html', 'pandas.zip') + if os.path.exists(zip_fname): + os.remove(zip_fname) + + if self.single_doc_html is not None: + self._open_browser(self.single_doc_html) + else: + self._add_redirects() + return ret_code + + def latex(self, force=False): + """ + Build PDF documentation. + """ + if sys.platform == 'win32': + sys.stderr.write('latex build has not been tested on windows\n') + else: + ret_code = self._sphinx_build('latex') + os.chdir(os.path.join(BUILD_PATH, 'latex')) + if force: + for i in range(3): + self._run_os('pdflatex', + '-interaction=nonstopmode', + 'pandas.tex') + raise SystemExit('You should check the file ' + '"build/latex/pandas.pdf" for problems.') + else: + self._run_os('make') + return ret_code + + def latex_forced(self): + """ + Build PDF documentation with retries to find missing references. + """ + return self.latex(force=True) + + @staticmethod + def clean(): + """ + Clean documentation generated files. + """ + shutil.rmtree(BUILD_PATH, ignore_errors=True) + shutil.rmtree(os.path.join(SOURCE_PATH, 'reference', 'api'), + ignore_errors=True) + + def zip_html(self): + """ + Compress HTML documentation into a zip file. + """ + zip_fname = os.path.join(BUILD_PATH, 'html', 'pandas.zip') + if os.path.exists(zip_fname): + os.remove(zip_fname) + dirname = os.path.join(BUILD_PATH, 'html') + fnames = os.listdir(dirname) + os.chdir(dirname) + self._run_os('zip', + zip_fname, + '-r', + '-q', + *fnames) -import argparse -argparser = argparse.ArgumentParser(description="pandas documentation builder", - epilog="Targets : %s" % funcd.keys()) - -argparser.add_argument('--no-api', - default=False, - help='Ommit api and autosummary', - action='store_true') -argparser.add_argument('--single', - metavar='FILENAME', - type=str, - default=False, - help='filename of section to compile, e.g. 
"indexing"') -argparser.add_argument('--user', - type=str, - default=False, - help='Username to connect to the pydata server') def main(): - args, unknown = argparser.parse_known_args() - sys.argv = [sys.argv[0]] + unknown - if args.single: - args.single = os.path.basename(args.single).split(".rst")[0] - - if 'clean' in unknown: - args.single=False - - generate_index(api=not args.no_api and not args.single, single=args.single) - - if len(sys.argv) > 2: - ftype = sys.argv[1] - ver = sys.argv[2] - - if ftype == 'build_previous': - build_prev(ver, user=args.user) - if ftype == 'upload_previous': - upload_prev(ver, user=args.user) - elif len(sys.argv) == 2: - for arg in sys.argv[1:]: - func = funcd.get(arg) - if func is None: - raise SystemExit('Do not know how to handle %s; valid args are %s' % ( - arg, list(funcd.keys()))) - if args.user: - func(user=args.user) - else: - func() - else: - small_docs = False - all() -# os.chdir(current_dir) + cmds = [method for method in dir(DocBuilder) if not method.startswith('_')] + + argparser = argparse.ArgumentParser( + description='pandas documentation builder', + epilog='Commands: {}'.format(','.join(cmds))) + argparser.add_argument('command', + nargs='?', + default='html', + help='command to run: {}'.format(', '.join(cmds))) + argparser.add_argument('--num-jobs', + type=int, + default=0, + help='number of jobs used by sphinx-build') + argparser.add_argument('--no-api', + default=False, + help='omit api and autosummary', + action='store_true') + argparser.add_argument('--single', + metavar='FILENAME', + type=str, + default=None, + help=('filename (relative to the "source" folder)' + ' of section or method name to compile, e.g. ' + '"development/contributing.rst",' + ' "ecosystem.rst", "pandas.DataFrame.join"')) + argparser.add_argument('--python-path', + type=str, + default=os.path.dirname(DOC_PATH), + help='path') + argparser.add_argument('-v', action='count', dest='verbosity', default=0, + help=('increase verbosity (can be repeated), ' + 'passed to the sphinx build command')) + argparser.add_argument('--warnings-are-errors', '-W', + action='store_true', + help='fail if warnings are raised') + args = argparser.parse_args() + + if args.command not in cmds: + raise ValueError('Unknown command {}. Available options: {}'.format( + args.command, ', '.join(cmds))) + + # Below we update both os.environ and sys.path. The former is used by + # external libraries (namely Sphinx) to compile this module and resolve + # the import of `python_path` correctly. The latter is used to resolve + # the import within the module, injecting it into the global namespace + os.environ['PYTHONPATH'] = args.python_path + sys.path.insert(0, args.python_path) + globals()['pandas'] = importlib.import_module('pandas') + + # Set the matplotlib backend to the non-interactive Agg backend for all + # child processes. 
+ os.environ['MPLBACKEND'] = 'module://matplotlib.backends.backend_agg' + + builder = DocBuilder(args.num_jobs, not args.no_api, args.single, + args.verbosity, args.warnings_are_errors) + return getattr(builder, args.command)() + if __name__ == '__main__': - import sys sys.exit(main()) diff --git a/doc/plots/stats/moment_plots.py b/doc/plots/stats/moment_plots.py deleted file mode 100644 index 9e3a902592c6b..0000000000000 --- a/doc/plots/stats/moment_plots.py +++ /dev/null @@ -1,30 +0,0 @@ -import numpy as np - -import matplotlib.pyplot as plt -import pandas.util.testing as t -import pandas.stats.moments as m - - -def test_series(n=1000): - t.N = n - s = t.makeTimeSeries() - return s - - -def plot_timeseries(*args, **kwds): - n = len(args) - - fig, axes = plt.subplots(n, 1, figsize=kwds.get('size', (10, 5)), - sharex=True) - titles = kwds.get('titles', None) - - for k in range(1, n + 1): - ax = axes[k - 1] - ts = args[k - 1] - ax.plot(ts.index, ts.values) - - if titles: - ax.set_title(titles[k - 1]) - - fig.autofmt_xdate() - fig.subplots_adjust(bottom=0.10, top=0.95) diff --git a/doc/plots/stats/moments_ewma.py b/doc/plots/stats/moments_ewma.py deleted file mode 100644 index 3e521ed60bb8f..0000000000000 --- a/doc/plots/stats/moments_ewma.py +++ /dev/null @@ -1,15 +0,0 @@ -import matplotlib.pyplot as plt -import pandas.util.testing as t -import pandas.stats.moments as m - -t.N = 200 -s = t.makeTimeSeries().cumsum() - -plt.figure(figsize=(10, 5)) -plt.plot(s.index, s.values) -plt.plot(s.index, m.ewma(s, 20, min_periods=1).values) -f = plt.gcf() -f.autofmt_xdate() - -plt.show() -plt.close('all') diff --git a/doc/plots/stats/moments_ewmvol.py b/doc/plots/stats/moments_ewmvol.py deleted file mode 100644 index 093f62868fc4e..0000000000000 --- a/doc/plots/stats/moments_ewmvol.py +++ /dev/null @@ -1,23 +0,0 @@ -import matplotlib.pyplot as plt -import pandas.util.testing as t -import pandas.stats.moments as m - -t.N = 500 -ts = t.makeTimeSeries() -ts[::100] = 20 - -s = ts.cumsum() - - -plt.figure(figsize=(10, 5)) -plt.plot(s.index, m.ewmvol(s, span=50, min_periods=1).values, color='b') -plt.plot(s.index, m.rolling_std(s, 50, min_periods=1).values, color='r') - -plt.title('Exp-weighted std with shocks') -plt.legend(('Exp-weighted', 'Equal-weighted')) - -f = plt.gcf() -f.autofmt_xdate() - -plt.show() -plt.close('all') diff --git a/doc/plots/stats/moments_expw.py b/doc/plots/stats/moments_expw.py deleted file mode 100644 index 5fff419b3a940..0000000000000 --- a/doc/plots/stats/moments_expw.py +++ /dev/null @@ -1,35 +0,0 @@ -from moment_plots import * - -np.random.seed(1) - -ts = test_series(500) * 10 - -# ts[::100] = 20 - -s = ts.cumsum() - -fig, axes = plt.subplots(3, 1, figsize=(8, 10), sharex=True) - -ax0, ax1, ax2 = axes - -ax0.plot(s.index, s.values) -ax0.set_title('time series') - -ax1.plot(s.index, m.ewma(s, span=50, min_periods=1).values, color='b') -ax1.plot(s.index, m.rolling_mean(s, 50, min_periods=1).values, color='r') -ax1.set_title('rolling_mean vs. ewma') - -line1 = ax2.plot( - s.index, m.ewmstd(s, span=50, min_periods=1).values, color='b') -line2 = ax2.plot( - s.index, m.rolling_std(s, 50, min_periods=1).values, color='r') -ax2.set_title('rolling_std vs. 
ewmstd') - -fig.legend((line1, line2), - ('Exp-weighted', 'Equal-weighted'), - loc='upper right') -fig.autofmt_xdate() -fig.subplots_adjust(bottom=0.10, top=0.95) - -plt.show() -plt.close('all') diff --git a/doc/plots/stats/moments_rolling.py b/doc/plots/stats/moments_rolling.py deleted file mode 100644 index 30a6c5f53e20c..0000000000000 --- a/doc/plots/stats/moments_rolling.py +++ /dev/null @@ -1,24 +0,0 @@ -from moment_plots import * - -ts = test_series() -s = ts.cumsum() - -s[20:50] = np.NaN -s[120:150] = np.NaN -plot_timeseries(s, - m.rolling_count(s, 50), - m.rolling_sum(s, 50, min_periods=10), - m.rolling_mean(s, 50, min_periods=10), - m.rolling_std(s, 50, min_periods=10), - m.rolling_skew(s, 50, min_periods=10), - m.rolling_kurt(s, 50, min_periods=10), - size=(10, 12), - titles=('time series', - 'rolling_count', - 'rolling_sum', - 'rolling_mean', - 'rolling_std', - 'rolling_skew', - 'rolling_kurt')) -plt.show() -plt.close('all') diff --git a/doc/plots/stats/moments_rolling_binary.py b/doc/plots/stats/moments_rolling_binary.py deleted file mode 100644 index ab6b7b1c8ff49..0000000000000 --- a/doc/plots/stats/moments_rolling_binary.py +++ /dev/null @@ -1,30 +0,0 @@ -from moment_plots import * - -np.random.seed(1) - -ts = test_series() -s = ts.cumsum() -ts2 = test_series() -s2 = ts2.cumsum() - -s[20:50] = np.NaN -s[120:150] = np.NaN -fig, axes = plt.subplots(3, 1, figsize=(8, 10), sharex=True) - -ax0, ax1, ax2 = axes - -ax0.plot(s.index, s.values) -ax0.plot(s2.index, s2.values) -ax0.set_title('time series') - -ax1.plot(s.index, m.rolling_corr(s, s2, 50, min_periods=1).values) -ax1.set_title('rolling_corr') - -ax2.plot(s.index, m.rolling_cov(s, s2, 50, min_periods=1).values) -ax2.set_title('rolling_cov') - -fig.autofmt_xdate() -fig.subplots_adjust(bottom=0.10, top=0.95) - -plt.show() -plt.close('all') diff --git a/doc/redirects.csv b/doc/redirects.csv new file mode 100644 index 0000000000000..a7886779c97d5 --- /dev/null +++ b/doc/redirects.csv @@ -0,0 +1,1581 @@ +# This file should contain all the redirects in the documentation +# in the format `,` + +# whatsnew +whatsnew,whatsnew/index +release,whatsnew/index + +# getting started +10min,getting_started/10min +basics,getting_started/basics +comparison_with_r,getting_started/comparison/comparison_with_r +comparison_with_sql,getting_started/comparison/comparison_with_sql +comparison_with_sas,getting_started/comparison/comparison_with_sas +comparison_with_stata,getting_started/comparison/comparison_with_stata +dsintro,getting_started/dsintro +overview,getting_started/overview +tutorials,getting_started/tutorials + +# user guide +advanced,user_guide/advanced +categorical,user_guide/categorical +computation,user_guide/computation +cookbook,user_guide/cookbook +enhancingperf,user_guide/enhancingperf +gotchas,user_guide/gotchas +groupby,user_guide/groupby +indexing,user_guide/indexing +integer_na,user_guide/integer_na +io,user_guide/io +merging,user_guide/merging +missing_data,user_guide/missing_data +options,user_guide/options +reshaping,user_guide/reshaping +sparse,user_guide/sparse +style,user_guide/style +text,user_guide/text +timedeltas,user_guide/timedeltas +timeseries,user_guide/timeseries +visualization,user_guide/visualization + +# development +contributing,development/contributing +contributing_docstring,development/contributing_docstring +developer,development/developer +extending,development/extending +internals,development/internals + +# api +api,reference/index 
+generated/pandas.api.extensions.ExtensionArray.argsort,../reference/api/pandas.api.extensions.ExtensionArray.argsort +generated/pandas.api.extensions.ExtensionArray.astype,../reference/api/pandas.api.extensions.ExtensionArray.astype +generated/pandas.api.extensions.ExtensionArray.copy,../reference/api/pandas.api.extensions.ExtensionArray.copy +generated/pandas.api.extensions.ExtensionArray.dropna,../reference/api/pandas.api.extensions.ExtensionArray.dropna +generated/pandas.api.extensions.ExtensionArray.dtype,../reference/api/pandas.api.extensions.ExtensionArray.dtype +generated/pandas.api.extensions.ExtensionArray.factorize,../reference/api/pandas.api.extensions.ExtensionArray.factorize +generated/pandas.api.extensions.ExtensionArray.fillna,../reference/api/pandas.api.extensions.ExtensionArray.fillna +generated/pandas.api.extensions.ExtensionArray,../reference/api/pandas.api.extensions.ExtensionArray +generated/pandas.api.extensions.ExtensionArray.isna,../reference/api/pandas.api.extensions.ExtensionArray.isna +generated/pandas.api.extensions.ExtensionArray.nbytes,../reference/api/pandas.api.extensions.ExtensionArray.nbytes +generated/pandas.api.extensions.ExtensionArray.ndim,../reference/api/pandas.api.extensions.ExtensionArray.ndim +generated/pandas.api.extensions.ExtensionArray.shape,../reference/api/pandas.api.extensions.ExtensionArray.shape +generated/pandas.api.extensions.ExtensionArray.take,../reference/api/pandas.api.extensions.ExtensionArray.take +generated/pandas.api.extensions.ExtensionArray.unique,../reference/api/pandas.api.extensions.ExtensionArray.unique +generated/pandas.api.extensions.ExtensionDtype.construct_array_type,../reference/api/pandas.api.extensions.ExtensionDtype.construct_array_type +generated/pandas.api.extensions.ExtensionDtype.construct_from_string,../reference/api/pandas.api.extensions.ExtensionDtype.construct_from_string +generated/pandas.api.extensions.ExtensionDtype,../reference/api/pandas.api.extensions.ExtensionDtype +generated/pandas.api.extensions.ExtensionDtype.is_dtype,../reference/api/pandas.api.extensions.ExtensionDtype.is_dtype +generated/pandas.api.extensions.ExtensionDtype.kind,../reference/api/pandas.api.extensions.ExtensionDtype.kind +generated/pandas.api.extensions.ExtensionDtype.name,../reference/api/pandas.api.extensions.ExtensionDtype.name +generated/pandas.api.extensions.ExtensionDtype.names,../reference/api/pandas.api.extensions.ExtensionDtype.names +generated/pandas.api.extensions.ExtensionDtype.na_value,../reference/api/pandas.api.extensions.ExtensionDtype.na_value +generated/pandas.api.extensions.ExtensionDtype.type,../reference/api/pandas.api.extensions.ExtensionDtype.type +generated/pandas.api.extensions.register_dataframe_accessor,../reference/api/pandas.api.extensions.register_dataframe_accessor +generated/pandas.api.extensions.register_extension_dtype,../reference/api/pandas.api.extensions.register_extension_dtype +generated/pandas.api.extensions.register_index_accessor,../reference/api/pandas.api.extensions.register_index_accessor +generated/pandas.api.extensions.register_series_accessor,../reference/api/pandas.api.extensions.register_series_accessor +generated/pandas.api.types.infer_dtype,../reference/api/pandas.api.types.infer_dtype +generated/pandas.api.types.is_bool_dtype,../reference/api/pandas.api.types.is_bool_dtype +generated/pandas.api.types.is_bool,../reference/api/pandas.api.types.is_bool +generated/pandas.api.types.is_categorical_dtype,../reference/api/pandas.api.types.is_categorical_dtype 
+generated/pandas.api.types.is_categorical,../reference/api/pandas.api.types.is_categorical +generated/pandas.api.types.is_complex_dtype,../reference/api/pandas.api.types.is_complex_dtype +generated/pandas.api.types.is_complex,../reference/api/pandas.api.types.is_complex +generated/pandas.api.types.is_datetime64_any_dtype,../reference/api/pandas.api.types.is_datetime64_any_dtype +generated/pandas.api.types.is_datetime64_dtype,../reference/api/pandas.api.types.is_datetime64_dtype +generated/pandas.api.types.is_datetime64_ns_dtype,../reference/api/pandas.api.types.is_datetime64_ns_dtype +generated/pandas.api.types.is_datetime64tz_dtype,../reference/api/pandas.api.types.is_datetime64tz_dtype +generated/pandas.api.types.is_datetimetz,../reference/api/pandas.api.types.is_datetimetz +generated/pandas.api.types.is_dict_like,../reference/api/pandas.api.types.is_dict_like +generated/pandas.api.types.is_extension_array_dtype,../reference/api/pandas.api.types.is_extension_array_dtype +generated/pandas.api.types.is_extension_type,../reference/api/pandas.api.types.is_extension_type +generated/pandas.api.types.is_file_like,../reference/api/pandas.api.types.is_file_like +generated/pandas.api.types.is_float_dtype,../reference/api/pandas.api.types.is_float_dtype +generated/pandas.api.types.is_float,../reference/api/pandas.api.types.is_float +generated/pandas.api.types.is_hashable,../reference/api/pandas.api.types.is_hashable +generated/pandas.api.types.is_int64_dtype,../reference/api/pandas.api.types.is_int64_dtype +generated/pandas.api.types.is_integer_dtype,../reference/api/pandas.api.types.is_integer_dtype +generated/pandas.api.types.is_integer,../reference/api/pandas.api.types.is_integer +generated/pandas.api.types.is_interval_dtype,../reference/api/pandas.api.types.is_interval_dtype +generated/pandas.api.types.is_interval,../reference/api/pandas.api.types.is_interval +generated/pandas.api.types.is_iterator,../reference/api/pandas.api.types.is_iterator +generated/pandas.api.types.is_list_like,../reference/api/pandas.api.types.is_list_like +generated/pandas.api.types.is_named_tuple,../reference/api/pandas.api.types.is_named_tuple +generated/pandas.api.types.is_number,../reference/api/pandas.api.types.is_number +generated/pandas.api.types.is_numeric_dtype,../reference/api/pandas.api.types.is_numeric_dtype +generated/pandas.api.types.is_object_dtype,../reference/api/pandas.api.types.is_object_dtype +generated/pandas.api.types.is_period_dtype,../reference/api/pandas.api.types.is_period_dtype +generated/pandas.api.types.is_period,../reference/api/pandas.api.types.is_period +generated/pandas.api.types.is_re_compilable,../reference/api/pandas.api.types.is_re_compilable +generated/pandas.api.types.is_re,../reference/api/pandas.api.types.is_re +generated/pandas.api.types.is_scalar,../reference/api/pandas.api.types.is_scalar +generated/pandas.api.types.is_signed_integer_dtype,../reference/api/pandas.api.types.is_signed_integer_dtype +generated/pandas.api.types.is_sparse,../reference/api/pandas.api.types.is_sparse +generated/pandas.api.types.is_string_dtype,../reference/api/pandas.api.types.is_string_dtype +generated/pandas.api.types.is_timedelta64_dtype,../reference/api/pandas.api.types.is_timedelta64_dtype +generated/pandas.api.types.is_timedelta64_ns_dtype,../reference/api/pandas.api.types.is_timedelta64_ns_dtype +generated/pandas.api.types.is_unsigned_integer_dtype,../reference/api/pandas.api.types.is_unsigned_integer_dtype 
+generated/pandas.api.types.pandas_dtype,../reference/api/pandas.api.types.pandas_dtype +generated/pandas.api.types.union_categoricals,../reference/api/pandas.api.types.union_categoricals +generated/pandas.bdate_range,../reference/api/pandas.bdate_range +generated/pandas.Categorical.__array__,../reference/api/pandas.Categorical.__array__ +generated/pandas.Categorical.categories,../reference/api/pandas.Categorical.categories +generated/pandas.Categorical.codes,../reference/api/pandas.Categorical.codes +generated/pandas.CategoricalDtype.categories,../reference/api/pandas.CategoricalDtype.categories +generated/pandas.Categorical.dtype,../reference/api/pandas.Categorical.dtype +generated/pandas.CategoricalDtype,../reference/api/pandas.CategoricalDtype +generated/pandas.CategoricalDtype.ordered,../reference/api/pandas.CategoricalDtype.ordered +generated/pandas.Categorical.from_codes,../reference/api/pandas.Categorical.from_codes +generated/pandas.Categorical,../reference/api/pandas.Categorical +generated/pandas.CategoricalIndex.add_categories,../reference/api/pandas.CategoricalIndex.add_categories +generated/pandas.CategoricalIndex.as_ordered,../reference/api/pandas.CategoricalIndex.as_ordered +generated/pandas.CategoricalIndex.as_unordered,../reference/api/pandas.CategoricalIndex.as_unordered +generated/pandas.CategoricalIndex.categories,../reference/api/pandas.CategoricalIndex.categories +generated/pandas.CategoricalIndex.codes,../reference/api/pandas.CategoricalIndex.codes +generated/pandas.CategoricalIndex.equals,../reference/api/pandas.CategoricalIndex.equals +generated/pandas.CategoricalIndex,../reference/api/pandas.CategoricalIndex +generated/pandas.CategoricalIndex.map,../reference/api/pandas.CategoricalIndex.map +generated/pandas.CategoricalIndex.ordered,../reference/api/pandas.CategoricalIndex.ordered +generated/pandas.CategoricalIndex.remove_categories,../reference/api/pandas.CategoricalIndex.remove_categories +generated/pandas.CategoricalIndex.remove_unused_categories,../reference/api/pandas.CategoricalIndex.remove_unused_categories +generated/pandas.CategoricalIndex.rename_categories,../reference/api/pandas.CategoricalIndex.rename_categories +generated/pandas.CategoricalIndex.reorder_categories,../reference/api/pandas.CategoricalIndex.reorder_categories +generated/pandas.CategoricalIndex.set_categories,../reference/api/pandas.CategoricalIndex.set_categories +generated/pandas.Categorical.ordered,../reference/api/pandas.Categorical.ordered +generated/pandas.concat,../reference/api/pandas.concat +generated/pandas.core.groupby.DataFrameGroupBy.all,../reference/api/pandas.core.groupby.DataFrameGroupBy.all +generated/pandas.core.groupby.DataFrameGroupBy.any,../reference/api/pandas.core.groupby.DataFrameGroupBy.any +generated/pandas.core.groupby.DataFrameGroupBy.bfill,../reference/api/pandas.core.groupby.DataFrameGroupBy.bfill +generated/pandas.core.groupby.DataFrameGroupBy.boxplot,../reference/api/pandas.core.groupby.DataFrameGroupBy.boxplot +generated/pandas.core.groupby.DataFrameGroupBy.corr,../reference/api/pandas.core.groupby.DataFrameGroupBy.corr +generated/pandas.core.groupby.DataFrameGroupBy.corrwith,../reference/api/pandas.core.groupby.DataFrameGroupBy.corrwith +generated/pandas.core.groupby.DataFrameGroupBy.count,../reference/api/pandas.core.groupby.DataFrameGroupBy.count +generated/pandas.core.groupby.DataFrameGroupBy.cov,../reference/api/pandas.core.groupby.DataFrameGroupBy.cov 
+generated/pandas.core.groupby.DataFrameGroupBy.cummax,../reference/api/pandas.core.groupby.DataFrameGroupBy.cummax +generated/pandas.core.groupby.DataFrameGroupBy.cummin,../reference/api/pandas.core.groupby.DataFrameGroupBy.cummin +generated/pandas.core.groupby.DataFrameGroupBy.cumprod,../reference/api/pandas.core.groupby.DataFrameGroupBy.cumprod +generated/pandas.core.groupby.DataFrameGroupBy.cumsum,../reference/api/pandas.core.groupby.DataFrameGroupBy.cumsum +generated/pandas.core.groupby.DataFrameGroupBy.describe,../reference/api/pandas.core.groupby.DataFrameGroupBy.describe +generated/pandas.core.groupby.DataFrameGroupBy.diff,../reference/api/pandas.core.groupby.DataFrameGroupBy.diff +generated/pandas.core.groupby.DataFrameGroupBy.ffill,../reference/api/pandas.core.groupby.DataFrameGroupBy.ffill +generated/pandas.core.groupby.DataFrameGroupBy.fillna,../reference/api/pandas.core.groupby.DataFrameGroupBy.fillna +generated/pandas.core.groupby.DataFrameGroupBy.filter,../reference/api/pandas.core.groupby.DataFrameGroupBy.filter +generated/pandas.core.groupby.DataFrameGroupBy.hist,../reference/api/pandas.core.groupby.DataFrameGroupBy.hist +generated/pandas.core.groupby.DataFrameGroupBy.idxmax,../reference/api/pandas.core.groupby.DataFrameGroupBy.idxmax +generated/pandas.core.groupby.DataFrameGroupBy.idxmin,../reference/api/pandas.core.groupby.DataFrameGroupBy.idxmin +generated/pandas.core.groupby.DataFrameGroupBy.mad,../reference/api/pandas.core.groupby.DataFrameGroupBy.mad +generated/pandas.core.groupby.DataFrameGroupBy.pct_change,../reference/api/pandas.core.groupby.DataFrameGroupBy.pct_change +generated/pandas.core.groupby.DataFrameGroupBy.plot,../reference/api/pandas.core.groupby.DataFrameGroupBy.plot +generated/pandas.core.groupby.DataFrameGroupBy.quantile,../reference/api/pandas.core.groupby.DataFrameGroupBy.quantile +generated/pandas.core.groupby.DataFrameGroupBy.rank,../reference/api/pandas.core.groupby.DataFrameGroupBy.rank +generated/pandas.core.groupby.DataFrameGroupBy.resample,../reference/api/pandas.core.groupby.DataFrameGroupBy.resample +generated/pandas.core.groupby.DataFrameGroupBy.shift,../reference/api/pandas.core.groupby.DataFrameGroupBy.shift +generated/pandas.core.groupby.DataFrameGroupBy.size,../reference/api/pandas.core.groupby.DataFrameGroupBy.size +generated/pandas.core.groupby.DataFrameGroupBy.skew,../reference/api/pandas.core.groupby.DataFrameGroupBy.skew +generated/pandas.core.groupby.DataFrameGroupBy.take,../reference/api/pandas.core.groupby.DataFrameGroupBy.take +generated/pandas.core.groupby.DataFrameGroupBy.tshift,../reference/api/pandas.core.groupby.DataFrameGroupBy.tshift +generated/pandas.core.groupby.GroupBy.agg,../reference/api/pandas.core.groupby.GroupBy.agg +generated/pandas.core.groupby.GroupBy.aggregate,../reference/api/pandas.core.groupby.GroupBy.aggregate +generated/pandas.core.groupby.GroupBy.all,../reference/api/pandas.core.groupby.GroupBy.all +generated/pandas.core.groupby.GroupBy.any,../reference/api/pandas.core.groupby.GroupBy.any +generated/pandas.core.groupby.GroupBy.apply,../reference/api/pandas.core.groupby.GroupBy.apply +generated/pandas.core.groupby.GroupBy.bfill,../reference/api/pandas.core.groupby.GroupBy.bfill +generated/pandas.core.groupby.GroupBy.count,../reference/api/pandas.core.groupby.GroupBy.count +generated/pandas.core.groupby.GroupBy.cumcount,../reference/api/pandas.core.groupby.GroupBy.cumcount +generated/pandas.core.groupby.GroupBy.ffill,../reference/api/pandas.core.groupby.GroupBy.ffill 
+generated/pandas.core.groupby.GroupBy.first,../reference/api/pandas.core.groupby.GroupBy.first +generated/pandas.core.groupby.GroupBy.get_group,../reference/api/pandas.core.groupby.GroupBy.get_group +generated/pandas.core.groupby.GroupBy.groups,../reference/api/pandas.core.groupby.GroupBy.groups +generated/pandas.core.groupby.GroupBy.head,../reference/api/pandas.core.groupby.GroupBy.head +generated/pandas.core.groupby.GroupBy.indices,../reference/api/pandas.core.groupby.GroupBy.indices +generated/pandas.core.groupby.GroupBy.__iter__,../reference/api/pandas.core.groupby.GroupBy.__iter__ +generated/pandas.core.groupby.GroupBy.last,../reference/api/pandas.core.groupby.GroupBy.last +generated/pandas.core.groupby.GroupBy.max,../reference/api/pandas.core.groupby.GroupBy.max +generated/pandas.core.groupby.GroupBy.mean,../reference/api/pandas.core.groupby.GroupBy.mean +generated/pandas.core.groupby.GroupBy.median,../reference/api/pandas.core.groupby.GroupBy.median +generated/pandas.core.groupby.GroupBy.min,../reference/api/pandas.core.groupby.GroupBy.min +generated/pandas.core.groupby.GroupBy.ngroup,../reference/api/pandas.core.groupby.GroupBy.ngroup +generated/pandas.core.groupby.GroupBy.nth,../reference/api/pandas.core.groupby.GroupBy.nth +generated/pandas.core.groupby.GroupBy.ohlc,../reference/api/pandas.core.groupby.GroupBy.ohlc +generated/pandas.core.groupby.GroupBy.pct_change,../reference/api/pandas.core.groupby.GroupBy.pct_change +generated/pandas.core.groupby.GroupBy.pipe,../reference/api/pandas.core.groupby.GroupBy.pipe +generated/pandas.core.groupby.GroupBy.prod,../reference/api/pandas.core.groupby.GroupBy.prod +generated/pandas.core.groupby.GroupBy.rank,../reference/api/pandas.core.groupby.GroupBy.rank +generated/pandas.core.groupby.GroupBy.sem,../reference/api/pandas.core.groupby.GroupBy.sem +generated/pandas.core.groupby.GroupBy.size,../reference/api/pandas.core.groupby.GroupBy.size +generated/pandas.core.groupby.GroupBy.std,../reference/api/pandas.core.groupby.GroupBy.std +generated/pandas.core.groupby.GroupBy.sum,../reference/api/pandas.core.groupby.GroupBy.sum +generated/pandas.core.groupby.GroupBy.tail,../reference/api/pandas.core.groupby.GroupBy.tail +generated/pandas.core.groupby.GroupBy.transform,../reference/api/pandas.core.groupby.GroupBy.transform +generated/pandas.core.groupby.GroupBy.var,../reference/api/pandas.core.groupby.GroupBy.var +generated/pandas.core.groupby.SeriesGroupBy.is_monotonic_decreasing,../reference/api/pandas.core.groupby.SeriesGroupBy.is_monotonic_decreasing +generated/pandas.core.groupby.SeriesGroupBy.is_monotonic_increasing,../reference/api/pandas.core.groupby.SeriesGroupBy.is_monotonic_increasing +generated/pandas.core.groupby.SeriesGroupBy.nlargest,../reference/api/pandas.core.groupby.SeriesGroupBy.nlargest +generated/pandas.core.groupby.SeriesGroupBy.nsmallest,../reference/api/pandas.core.groupby.SeriesGroupBy.nsmallest +generated/pandas.core.groupby.SeriesGroupBy.nunique,../reference/api/pandas.core.groupby.SeriesGroupBy.nunique +generated/pandas.core.groupby.SeriesGroupBy.unique,../reference/api/pandas.core.groupby.SeriesGroupBy.unique +generated/pandas.core.groupby.SeriesGroupBy.value_counts,../reference/api/pandas.core.groupby.SeriesGroupBy.value_counts +generated/pandas.core.resample.Resampler.aggregate,../reference/api/pandas.core.resample.Resampler.aggregate +generated/pandas.core.resample.Resampler.apply,../reference/api/pandas.core.resample.Resampler.apply 
+generated/pandas.core.resample.Resampler.asfreq,../reference/api/pandas.core.resample.Resampler.asfreq +generated/pandas.core.resample.Resampler.backfill,../reference/api/pandas.core.resample.Resampler.backfill +generated/pandas.core.resample.Resampler.bfill,../reference/api/pandas.core.resample.Resampler.bfill +generated/pandas.core.resample.Resampler.count,../reference/api/pandas.core.resample.Resampler.count +generated/pandas.core.resample.Resampler.ffill,../reference/api/pandas.core.resample.Resampler.ffill +generated/pandas.core.resample.Resampler.fillna,../reference/api/pandas.core.resample.Resampler.fillna +generated/pandas.core.resample.Resampler.first,../reference/api/pandas.core.resample.Resampler.first +generated/pandas.core.resample.Resampler.get_group,../reference/api/pandas.core.resample.Resampler.get_group +generated/pandas.core.resample.Resampler.groups,../reference/api/pandas.core.resample.Resampler.groups +generated/pandas.core.resample.Resampler.indices,../reference/api/pandas.core.resample.Resampler.indices +generated/pandas.core.resample.Resampler.interpolate,../reference/api/pandas.core.resample.Resampler.interpolate +generated/pandas.core.resample.Resampler.__iter__,../reference/api/pandas.core.resample.Resampler.__iter__ +generated/pandas.core.resample.Resampler.last,../reference/api/pandas.core.resample.Resampler.last +generated/pandas.core.resample.Resampler.max,../reference/api/pandas.core.resample.Resampler.max +generated/pandas.core.resample.Resampler.mean,../reference/api/pandas.core.resample.Resampler.mean +generated/pandas.core.resample.Resampler.median,../reference/api/pandas.core.resample.Resampler.median +generated/pandas.core.resample.Resampler.min,../reference/api/pandas.core.resample.Resampler.min +generated/pandas.core.resample.Resampler.nearest,../reference/api/pandas.core.resample.Resampler.nearest +generated/pandas.core.resample.Resampler.nunique,../reference/api/pandas.core.resample.Resampler.nunique +generated/pandas.core.resample.Resampler.ohlc,../reference/api/pandas.core.resample.Resampler.ohlc +generated/pandas.core.resample.Resampler.pad,../reference/api/pandas.core.resample.Resampler.pad +generated/pandas.core.resample.Resampler.pipe,../reference/api/pandas.core.resample.Resampler.pipe +generated/pandas.core.resample.Resampler.prod,../reference/api/pandas.core.resample.Resampler.prod +generated/pandas.core.resample.Resampler.quantile,../reference/api/pandas.core.resample.Resampler.quantile +generated/pandas.core.resample.Resampler.sem,../reference/api/pandas.core.resample.Resampler.sem +generated/pandas.core.resample.Resampler.size,../reference/api/pandas.core.resample.Resampler.size +generated/pandas.core.resample.Resampler.std,../reference/api/pandas.core.resample.Resampler.std +generated/pandas.core.resample.Resampler.sum,../reference/api/pandas.core.resample.Resampler.sum +generated/pandas.core.resample.Resampler.transform,../reference/api/pandas.core.resample.Resampler.transform +generated/pandas.core.resample.Resampler.var,../reference/api/pandas.core.resample.Resampler.var +generated/pandas.core.window.EWM.corr,../reference/api/pandas.core.window.EWM.corr +generated/pandas.core.window.EWM.cov,../reference/api/pandas.core.window.EWM.cov +generated/pandas.core.window.EWM.mean,../reference/api/pandas.core.window.EWM.mean +generated/pandas.core.window.EWM.std,../reference/api/pandas.core.window.EWM.std +generated/pandas.core.window.EWM.var,../reference/api/pandas.core.window.EWM.var 
+generated/pandas.core.window.Expanding.aggregate,../reference/api/pandas.core.window.Expanding.aggregate +generated/pandas.core.window.Expanding.apply,../reference/api/pandas.core.window.Expanding.apply +generated/pandas.core.window.Expanding.corr,../reference/api/pandas.core.window.Expanding.corr +generated/pandas.core.window.Expanding.count,../reference/api/pandas.core.window.Expanding.count +generated/pandas.core.window.Expanding.cov,../reference/api/pandas.core.window.Expanding.cov +generated/pandas.core.window.Expanding.kurt,../reference/api/pandas.core.window.Expanding.kurt +generated/pandas.core.window.Expanding.max,../reference/api/pandas.core.window.Expanding.max +generated/pandas.core.window.Expanding.mean,../reference/api/pandas.core.window.Expanding.mean +generated/pandas.core.window.Expanding.median,../reference/api/pandas.core.window.Expanding.median +generated/pandas.core.window.Expanding.min,../reference/api/pandas.core.window.Expanding.min +generated/pandas.core.window.Expanding.quantile,../reference/api/pandas.core.window.Expanding.quantile +generated/pandas.core.window.Expanding.skew,../reference/api/pandas.core.window.Expanding.skew +generated/pandas.core.window.Expanding.std,../reference/api/pandas.core.window.Expanding.std +generated/pandas.core.window.Expanding.sum,../reference/api/pandas.core.window.Expanding.sum +generated/pandas.core.window.Expanding.var,../reference/api/pandas.core.window.Expanding.var +generated/pandas.core.window.Rolling.aggregate,../reference/api/pandas.core.window.Rolling.aggregate +generated/pandas.core.window.Rolling.apply,../reference/api/pandas.core.window.Rolling.apply +generated/pandas.core.window.Rolling.corr,../reference/api/pandas.core.window.Rolling.corr +generated/pandas.core.window.Rolling.count,../reference/api/pandas.core.window.Rolling.count +generated/pandas.core.window.Rolling.cov,../reference/api/pandas.core.window.Rolling.cov +generated/pandas.core.window.Rolling.kurt,../reference/api/pandas.core.window.Rolling.kurt +generated/pandas.core.window.Rolling.max,../reference/api/pandas.core.window.Rolling.max +generated/pandas.core.window.Rolling.mean,../reference/api/pandas.core.window.Rolling.mean +generated/pandas.core.window.Rolling.median,../reference/api/pandas.core.window.Rolling.median +generated/pandas.core.window.Rolling.min,../reference/api/pandas.core.window.Rolling.min +generated/pandas.core.window.Rolling.quantile,../reference/api/pandas.core.window.Rolling.quantile +generated/pandas.core.window.Rolling.skew,../reference/api/pandas.core.window.Rolling.skew +generated/pandas.core.window.Rolling.std,../reference/api/pandas.core.window.Rolling.std +generated/pandas.core.window.Rolling.sum,../reference/api/pandas.core.window.Rolling.sum +generated/pandas.core.window.Rolling.var,../reference/api/pandas.core.window.Rolling.var +generated/pandas.core.window.Window.mean,../reference/api/pandas.core.window.Window.mean +generated/pandas.core.window.Window.sum,../reference/api/pandas.core.window.Window.sum +generated/pandas.crosstab,../reference/api/pandas.crosstab +generated/pandas.cut,../reference/api/pandas.cut +generated/pandas.DataFrame.abs,../reference/api/pandas.DataFrame.abs +generated/pandas.DataFrame.add,../reference/api/pandas.DataFrame.add +generated/pandas.DataFrame.add_prefix,../reference/api/pandas.DataFrame.add_prefix +generated/pandas.DataFrame.add_suffix,../reference/api/pandas.DataFrame.add_suffix +generated/pandas.DataFrame.agg,../reference/api/pandas.DataFrame.agg 
+generated/pandas.DataFrame.aggregate,../reference/api/pandas.DataFrame.aggregate +generated/pandas.DataFrame.align,../reference/api/pandas.DataFrame.align +generated/pandas.DataFrame.all,../reference/api/pandas.DataFrame.all +generated/pandas.DataFrame.any,../reference/api/pandas.DataFrame.any +generated/pandas.DataFrame.append,../reference/api/pandas.DataFrame.append +generated/pandas.DataFrame.apply,../reference/api/pandas.DataFrame.apply +generated/pandas.DataFrame.applymap,../reference/api/pandas.DataFrame.applymap +generated/pandas.DataFrame.as_blocks,../reference/api/pandas.DataFrame.as_blocks +generated/pandas.DataFrame.asfreq,../reference/api/pandas.DataFrame.asfreq +generated/pandas.DataFrame.as_matrix,../reference/api/pandas.DataFrame.as_matrix +generated/pandas.DataFrame.asof,../reference/api/pandas.DataFrame.asof +generated/pandas.DataFrame.assign,../reference/api/pandas.DataFrame.assign +generated/pandas.DataFrame.astype,../reference/api/pandas.DataFrame.astype +generated/pandas.DataFrame.at,../reference/api/pandas.DataFrame.at +generated/pandas.DataFrame.at_time,../reference/api/pandas.DataFrame.at_time +generated/pandas.DataFrame.axes,../reference/api/pandas.DataFrame.axes +generated/pandas.DataFrame.between_time,../reference/api/pandas.DataFrame.between_time +generated/pandas.DataFrame.bfill,../reference/api/pandas.DataFrame.bfill +generated/pandas.DataFrame.blocks,../reference/api/pandas.DataFrame.blocks +generated/pandas.DataFrame.bool,../reference/api/pandas.DataFrame.bool +generated/pandas.DataFrame.boxplot,../reference/api/pandas.DataFrame.boxplot +generated/pandas.DataFrame.clip,../reference/api/pandas.DataFrame.clip +generated/pandas.DataFrame.clip_lower,../reference/api/pandas.DataFrame.clip_lower +generated/pandas.DataFrame.clip_upper,../reference/api/pandas.DataFrame.clip_upper +generated/pandas.DataFrame.columns,../reference/api/pandas.DataFrame.columns +generated/pandas.DataFrame.combine_first,../reference/api/pandas.DataFrame.combine_first +generated/pandas.DataFrame.combine,../reference/api/pandas.DataFrame.combine +generated/pandas.DataFrame.compound,../reference/api/pandas.DataFrame.compound +generated/pandas.DataFrame.convert_objects,../reference/api/pandas.DataFrame.convert_objects +generated/pandas.DataFrame.copy,../reference/api/pandas.DataFrame.copy +generated/pandas.DataFrame.corr,../reference/api/pandas.DataFrame.corr +generated/pandas.DataFrame.corrwith,../reference/api/pandas.DataFrame.corrwith +generated/pandas.DataFrame.count,../reference/api/pandas.DataFrame.count +generated/pandas.DataFrame.cov,../reference/api/pandas.DataFrame.cov +generated/pandas.DataFrame.cummax,../reference/api/pandas.DataFrame.cummax +generated/pandas.DataFrame.cummin,../reference/api/pandas.DataFrame.cummin +generated/pandas.DataFrame.cumprod,../reference/api/pandas.DataFrame.cumprod +generated/pandas.DataFrame.cumsum,../reference/api/pandas.DataFrame.cumsum +generated/pandas.DataFrame.describe,../reference/api/pandas.DataFrame.describe +generated/pandas.DataFrame.diff,../reference/api/pandas.DataFrame.diff +generated/pandas.DataFrame.div,../reference/api/pandas.DataFrame.div +generated/pandas.DataFrame.divide,../reference/api/pandas.DataFrame.divide +generated/pandas.DataFrame.dot,../reference/api/pandas.DataFrame.dot +generated/pandas.DataFrame.drop_duplicates,../reference/api/pandas.DataFrame.drop_duplicates +generated/pandas.DataFrame.drop,../reference/api/pandas.DataFrame.drop +generated/pandas.DataFrame.droplevel,../reference/api/pandas.DataFrame.droplevel 
+generated/pandas.DataFrame.dropna,../reference/api/pandas.DataFrame.dropna +generated/pandas.DataFrame.dtypes,../reference/api/pandas.DataFrame.dtypes +generated/pandas.DataFrame.duplicated,../reference/api/pandas.DataFrame.duplicated +generated/pandas.DataFrame.empty,../reference/api/pandas.DataFrame.empty +generated/pandas.DataFrame.eq,../reference/api/pandas.DataFrame.eq +generated/pandas.DataFrame.equals,../reference/api/pandas.DataFrame.equals +generated/pandas.DataFrame.eval,../reference/api/pandas.DataFrame.eval +generated/pandas.DataFrame.ewm,../reference/api/pandas.DataFrame.ewm +generated/pandas.DataFrame.expanding,../reference/api/pandas.DataFrame.expanding +generated/pandas.DataFrame.ffill,../reference/api/pandas.DataFrame.ffill +generated/pandas.DataFrame.fillna,../reference/api/pandas.DataFrame.fillna +generated/pandas.DataFrame.filter,../reference/api/pandas.DataFrame.filter +generated/pandas.DataFrame.first,../reference/api/pandas.DataFrame.first +generated/pandas.DataFrame.first_valid_index,../reference/api/pandas.DataFrame.first_valid_index +generated/pandas.DataFrame.floordiv,../reference/api/pandas.DataFrame.floordiv +generated/pandas.DataFrame.from_csv,../reference/api/pandas.DataFrame.from_csv +generated/pandas.DataFrame.from_dict,../reference/api/pandas.DataFrame.from_dict +generated/pandas.DataFrame.from_items,../reference/api/pandas.DataFrame.from_items +generated/pandas.DataFrame.from_records,../reference/api/pandas.DataFrame.from_records +generated/pandas.DataFrame.ftypes,../reference/api/pandas.DataFrame.ftypes +generated/pandas.DataFrame.ge,../reference/api/pandas.DataFrame.ge +generated/pandas.DataFrame.get_dtype_counts,../reference/api/pandas.DataFrame.get_dtype_counts +generated/pandas.DataFrame.get_ftype_counts,../reference/api/pandas.DataFrame.get_ftype_counts +generated/pandas.DataFrame.get,../reference/api/pandas.DataFrame.get +generated/pandas.DataFrame.get_value,../reference/api/pandas.DataFrame.get_value +generated/pandas.DataFrame.get_values,../reference/api/pandas.DataFrame.get_values +generated/pandas.DataFrame.groupby,../reference/api/pandas.DataFrame.groupby +generated/pandas.DataFrame.gt,../reference/api/pandas.DataFrame.gt +generated/pandas.DataFrame.head,../reference/api/pandas.DataFrame.head +generated/pandas.DataFrame.hist,../reference/api/pandas.DataFrame.hist +generated/pandas.DataFrame,../reference/api/pandas.DataFrame +generated/pandas.DataFrame.iat,../reference/api/pandas.DataFrame.iat +generated/pandas.DataFrame.idxmax,../reference/api/pandas.DataFrame.idxmax +generated/pandas.DataFrame.idxmin,../reference/api/pandas.DataFrame.idxmin +generated/pandas.DataFrame.iloc,../reference/api/pandas.DataFrame.iloc +generated/pandas.DataFrame.index,../reference/api/pandas.DataFrame.index +generated/pandas.DataFrame.infer_objects,../reference/api/pandas.DataFrame.infer_objects +generated/pandas.DataFrame.info,../reference/api/pandas.DataFrame.info +generated/pandas.DataFrame.insert,../reference/api/pandas.DataFrame.insert +generated/pandas.DataFrame.interpolate,../reference/api/pandas.DataFrame.interpolate +generated/pandas.DataFrame.is_copy,../reference/api/pandas.DataFrame.is_copy +generated/pandas.DataFrame.isin,../reference/api/pandas.DataFrame.isin +generated/pandas.DataFrame.isna,../reference/api/pandas.DataFrame.isna +generated/pandas.DataFrame.isnull,../reference/api/pandas.DataFrame.isnull +generated/pandas.DataFrame.items,../reference/api/pandas.DataFrame.items 
+generated/pandas.DataFrame.__iter__,../reference/api/pandas.DataFrame.__iter__ +generated/pandas.DataFrame.iteritems,../reference/api/pandas.DataFrame.iteritems +generated/pandas.DataFrame.iterrows,../reference/api/pandas.DataFrame.iterrows +generated/pandas.DataFrame.itertuples,../reference/api/pandas.DataFrame.itertuples +generated/pandas.DataFrame.ix,../reference/api/pandas.DataFrame.ix +generated/pandas.DataFrame.join,../reference/api/pandas.DataFrame.join +generated/pandas.DataFrame.keys,../reference/api/pandas.DataFrame.keys +generated/pandas.DataFrame.kurt,../reference/api/pandas.DataFrame.kurt +generated/pandas.DataFrame.kurtosis,../reference/api/pandas.DataFrame.kurtosis +generated/pandas.DataFrame.last,../reference/api/pandas.DataFrame.last +generated/pandas.DataFrame.last_valid_index,../reference/api/pandas.DataFrame.last_valid_index +generated/pandas.DataFrame.le,../reference/api/pandas.DataFrame.le +generated/pandas.DataFrame.loc,../reference/api/pandas.DataFrame.loc +generated/pandas.DataFrame.lookup,../reference/api/pandas.DataFrame.lookup +generated/pandas.DataFrame.lt,../reference/api/pandas.DataFrame.lt +generated/pandas.DataFrame.mad,../reference/api/pandas.DataFrame.mad +generated/pandas.DataFrame.mask,../reference/api/pandas.DataFrame.mask +generated/pandas.DataFrame.max,../reference/api/pandas.DataFrame.max +generated/pandas.DataFrame.mean,../reference/api/pandas.DataFrame.mean +generated/pandas.DataFrame.median,../reference/api/pandas.DataFrame.median +generated/pandas.DataFrame.melt,../reference/api/pandas.DataFrame.melt +generated/pandas.DataFrame.memory_usage,../reference/api/pandas.DataFrame.memory_usage +generated/pandas.DataFrame.merge,../reference/api/pandas.DataFrame.merge +generated/pandas.DataFrame.min,../reference/api/pandas.DataFrame.min +generated/pandas.DataFrame.mode,../reference/api/pandas.DataFrame.mode +generated/pandas.DataFrame.mod,../reference/api/pandas.DataFrame.mod +generated/pandas.DataFrame.mul,../reference/api/pandas.DataFrame.mul +generated/pandas.DataFrame.multiply,../reference/api/pandas.DataFrame.multiply +generated/pandas.DataFrame.ndim,../reference/api/pandas.DataFrame.ndim +generated/pandas.DataFrame.ne,../reference/api/pandas.DataFrame.ne +generated/pandas.DataFrame.nlargest,../reference/api/pandas.DataFrame.nlargest +generated/pandas.DataFrame.notna,../reference/api/pandas.DataFrame.notna +generated/pandas.DataFrame.notnull,../reference/api/pandas.DataFrame.notnull +generated/pandas.DataFrame.nsmallest,../reference/api/pandas.DataFrame.nsmallest +generated/pandas.DataFrame.nunique,../reference/api/pandas.DataFrame.nunique +generated/pandas.DataFrame.pct_change,../reference/api/pandas.DataFrame.pct_change +generated/pandas.DataFrame.pipe,../reference/api/pandas.DataFrame.pipe +generated/pandas.DataFrame.pivot,../reference/api/pandas.DataFrame.pivot +generated/pandas.DataFrame.pivot_table,../reference/api/pandas.DataFrame.pivot_table +generated/pandas.DataFrame.plot.barh,../reference/api/pandas.DataFrame.plot.barh +generated/pandas.DataFrame.plot.bar,../reference/api/pandas.DataFrame.plot.bar +generated/pandas.DataFrame.plot.box,../reference/api/pandas.DataFrame.plot.box +generated/pandas.DataFrame.plot.density,../reference/api/pandas.DataFrame.plot.density +generated/pandas.DataFrame.plot.hexbin,../reference/api/pandas.DataFrame.plot.hexbin +generated/pandas.DataFrame.plot.hist,../reference/api/pandas.DataFrame.plot.hist +generated/pandas.DataFrame.plot,../reference/api/pandas.DataFrame.plot 
+generated/pandas.DataFrame.plot.kde,../reference/api/pandas.DataFrame.plot.kde +generated/pandas.DataFrame.plot.line,../reference/api/pandas.DataFrame.plot.line +generated/pandas.DataFrame.plot.pie,../reference/api/pandas.DataFrame.plot.pie +generated/pandas.DataFrame.plot.scatter,../reference/api/pandas.DataFrame.plot.scatter +generated/pandas.DataFrame.pop,../reference/api/pandas.DataFrame.pop +generated/pandas.DataFrame.pow,../reference/api/pandas.DataFrame.pow +generated/pandas.DataFrame.prod,../reference/api/pandas.DataFrame.prod +generated/pandas.DataFrame.product,../reference/api/pandas.DataFrame.product +generated/pandas.DataFrame.quantile,../reference/api/pandas.DataFrame.quantile +generated/pandas.DataFrame.query,../reference/api/pandas.DataFrame.query +generated/pandas.DataFrame.radd,../reference/api/pandas.DataFrame.radd +generated/pandas.DataFrame.rank,../reference/api/pandas.DataFrame.rank +generated/pandas.DataFrame.rdiv,../reference/api/pandas.DataFrame.rdiv +generated/pandas.DataFrame.reindex_axis,../reference/api/pandas.DataFrame.reindex_axis +generated/pandas.DataFrame.reindex,../reference/api/pandas.DataFrame.reindex +generated/pandas.DataFrame.reindex_like,../reference/api/pandas.DataFrame.reindex_like +generated/pandas.DataFrame.rename_axis,../reference/api/pandas.DataFrame.rename_axis +generated/pandas.DataFrame.rename,../reference/api/pandas.DataFrame.rename +generated/pandas.DataFrame.reorder_levels,../reference/api/pandas.DataFrame.reorder_levels +generated/pandas.DataFrame.replace,../reference/api/pandas.DataFrame.replace +generated/pandas.DataFrame.resample,../reference/api/pandas.DataFrame.resample +generated/pandas.DataFrame.reset_index,../reference/api/pandas.DataFrame.reset_index +generated/pandas.DataFrame.rfloordiv,../reference/api/pandas.DataFrame.rfloordiv +generated/pandas.DataFrame.rmod,../reference/api/pandas.DataFrame.rmod +generated/pandas.DataFrame.rmul,../reference/api/pandas.DataFrame.rmul +generated/pandas.DataFrame.rolling,../reference/api/pandas.DataFrame.rolling +generated/pandas.DataFrame.round,../reference/api/pandas.DataFrame.round +generated/pandas.DataFrame.rpow,../reference/api/pandas.DataFrame.rpow +generated/pandas.DataFrame.rsub,../reference/api/pandas.DataFrame.rsub +generated/pandas.DataFrame.rtruediv,../reference/api/pandas.DataFrame.rtruediv +generated/pandas.DataFrame.sample,../reference/api/pandas.DataFrame.sample +generated/pandas.DataFrame.select_dtypes,../reference/api/pandas.DataFrame.select_dtypes +generated/pandas.DataFrame.select,../reference/api/pandas.DataFrame.select +generated/pandas.DataFrame.sem,../reference/api/pandas.DataFrame.sem +generated/pandas.DataFrame.set_axis,../reference/api/pandas.DataFrame.set_axis +generated/pandas.DataFrame.set_index,../reference/api/pandas.DataFrame.set_index +generated/pandas.DataFrame.set_value,../reference/api/pandas.DataFrame.set_value +generated/pandas.DataFrame.shape,../reference/api/pandas.DataFrame.shape +generated/pandas.DataFrame.shift,../reference/api/pandas.DataFrame.shift +generated/pandas.DataFrame.size,../reference/api/pandas.DataFrame.size +generated/pandas.DataFrame.skew,../reference/api/pandas.DataFrame.skew +generated/pandas.DataFrame.slice_shift,../reference/api/pandas.DataFrame.slice_shift +generated/pandas.DataFrame.sort_index,../reference/api/pandas.DataFrame.sort_index +generated/pandas.DataFrame.sort_values,../reference/api/pandas.DataFrame.sort_values +generated/pandas.DataFrame.squeeze,../reference/api/pandas.DataFrame.squeeze 
+generated/pandas.DataFrame.stack,../reference/api/pandas.DataFrame.stack +generated/pandas.DataFrame.std,../reference/api/pandas.DataFrame.std +generated/pandas.DataFrame.style,../reference/api/pandas.DataFrame.style +generated/pandas.DataFrame.sub,../reference/api/pandas.DataFrame.sub +generated/pandas.DataFrame.subtract,../reference/api/pandas.DataFrame.subtract +generated/pandas.DataFrame.sum,../reference/api/pandas.DataFrame.sum +generated/pandas.DataFrame.swapaxes,../reference/api/pandas.DataFrame.swapaxes +generated/pandas.DataFrame.swaplevel,../reference/api/pandas.DataFrame.swaplevel +generated/pandas.DataFrame.tail,../reference/api/pandas.DataFrame.tail +generated/pandas.DataFrame.take,../reference/api/pandas.DataFrame.take +generated/pandas.DataFrame.T,../reference/api/pandas.DataFrame.T +generated/pandas.DataFrame.timetuple,../reference/api/pandas.DataFrame.timetuple +generated/pandas.DataFrame.to_clipboard,../reference/api/pandas.DataFrame.to_clipboard +generated/pandas.DataFrame.to_csv,../reference/api/pandas.DataFrame.to_csv +generated/pandas.DataFrame.to_dense,../reference/api/pandas.DataFrame.to_dense +generated/pandas.DataFrame.to_dict,../reference/api/pandas.DataFrame.to_dict +generated/pandas.DataFrame.to_excel,../reference/api/pandas.DataFrame.to_excel +generated/pandas.DataFrame.to_feather,../reference/api/pandas.DataFrame.to_feather +generated/pandas.DataFrame.to_gbq,../reference/api/pandas.DataFrame.to_gbq +generated/pandas.DataFrame.to_hdf,../reference/api/pandas.DataFrame.to_hdf +generated/pandas.DataFrame.to,../reference/api/pandas.DataFrame.to +generated/pandas.DataFrame.to_json,../reference/api/pandas.DataFrame.to_json +generated/pandas.DataFrame.to_latex,../reference/api/pandas.DataFrame.to_latex +generated/pandas.DataFrame.to_msgpack,../reference/api/pandas.DataFrame.to_msgpack +generated/pandas.DataFrame.to_numpy,../reference/api/pandas.DataFrame.to_numpy +generated/pandas.DataFrame.to_panel,../reference/api/pandas.DataFrame.to_panel +generated/pandas.DataFrame.to_parquet,../reference/api/pandas.DataFrame.to_parquet +generated/pandas.DataFrame.to_period,../reference/api/pandas.DataFrame.to_period +generated/pandas.DataFrame.to_pickle,../reference/api/pandas.DataFrame.to_pickle +generated/pandas.DataFrame.to_records,../reference/api/pandas.DataFrame.to_records +generated/pandas.DataFrame.to_sparse,../reference/api/pandas.DataFrame.to_sparse +generated/pandas.DataFrame.to_sql,../reference/api/pandas.DataFrame.to_sql +generated/pandas.DataFrame.to_stata,../reference/api/pandas.DataFrame.to_stata +generated/pandas.DataFrame.to_string,../reference/api/pandas.DataFrame.to_string +generated/pandas.DataFrame.to_timestamp,../reference/api/pandas.DataFrame.to_timestamp +generated/pandas.DataFrame.to_xarray,../reference/api/pandas.DataFrame.to_xarray +generated/pandas.DataFrame.transform,../reference/api/pandas.DataFrame.transform +generated/pandas.DataFrame.transpose,../reference/api/pandas.DataFrame.transpose +generated/pandas.DataFrame.truediv,../reference/api/pandas.DataFrame.truediv +generated/pandas.DataFrame.truncate,../reference/api/pandas.DataFrame.truncate +generated/pandas.DataFrame.tshift,../reference/api/pandas.DataFrame.tshift +generated/pandas.DataFrame.tz_convert,../reference/api/pandas.DataFrame.tz_convert +generated/pandas.DataFrame.tz_localize,../reference/api/pandas.DataFrame.tz_localize +generated/pandas.DataFrame.unstack,../reference/api/pandas.DataFrame.unstack +generated/pandas.DataFrame.update,../reference/api/pandas.DataFrame.update 
+generated/pandas.DataFrame.values,../reference/api/pandas.DataFrame.values +generated/pandas.DataFrame.var,../reference/api/pandas.DataFrame.var +generated/pandas.DataFrame.where,../reference/api/pandas.DataFrame.where +generated/pandas.DataFrame.xs,../reference/api/pandas.DataFrame.xs +generated/pandas.date_range,../reference/api/pandas.date_range +generated/pandas.DatetimeIndex.ceil,../reference/api/pandas.DatetimeIndex.ceil +generated/pandas.DatetimeIndex.date,../reference/api/pandas.DatetimeIndex.date +generated/pandas.DatetimeIndex.day,../reference/api/pandas.DatetimeIndex.day +generated/pandas.DatetimeIndex.day_name,../reference/api/pandas.DatetimeIndex.day_name +generated/pandas.DatetimeIndex.dayofweek,../reference/api/pandas.DatetimeIndex.dayofweek +generated/pandas.DatetimeIndex.dayofyear,../reference/api/pandas.DatetimeIndex.dayofyear +generated/pandas.DatetimeIndex.floor,../reference/api/pandas.DatetimeIndex.floor +generated/pandas.DatetimeIndex.freq,../reference/api/pandas.DatetimeIndex.freq +generated/pandas.DatetimeIndex.freqstr,../reference/api/pandas.DatetimeIndex.freqstr +generated/pandas.DatetimeIndex.hour,../reference/api/pandas.DatetimeIndex.hour +generated/pandas.DatetimeIndex,../reference/api/pandas.DatetimeIndex +generated/pandas.DatetimeIndex.indexer_at_time,../reference/api/pandas.DatetimeIndex.indexer_at_time +generated/pandas.DatetimeIndex.indexer_between_time,../reference/api/pandas.DatetimeIndex.indexer_between_time +generated/pandas.DatetimeIndex.inferred_freq,../reference/api/pandas.DatetimeIndex.inferred_freq +generated/pandas.DatetimeIndex.is_leap_year,../reference/api/pandas.DatetimeIndex.is_leap_year +generated/pandas.DatetimeIndex.is_month_end,../reference/api/pandas.DatetimeIndex.is_month_end +generated/pandas.DatetimeIndex.is_month_start,../reference/api/pandas.DatetimeIndex.is_month_start +generated/pandas.DatetimeIndex.is_quarter_end,../reference/api/pandas.DatetimeIndex.is_quarter_end +generated/pandas.DatetimeIndex.is_quarter_start,../reference/api/pandas.DatetimeIndex.is_quarter_start +generated/pandas.DatetimeIndex.is_year_end,../reference/api/pandas.DatetimeIndex.is_year_end +generated/pandas.DatetimeIndex.is_year_start,../reference/api/pandas.DatetimeIndex.is_year_start +generated/pandas.DatetimeIndex.microsecond,../reference/api/pandas.DatetimeIndex.microsecond +generated/pandas.DatetimeIndex.minute,../reference/api/pandas.DatetimeIndex.minute +generated/pandas.DatetimeIndex.month,../reference/api/pandas.DatetimeIndex.month +generated/pandas.DatetimeIndex.month_name,../reference/api/pandas.DatetimeIndex.month_name +generated/pandas.DatetimeIndex.nanosecond,../reference/api/pandas.DatetimeIndex.nanosecond +generated/pandas.DatetimeIndex.normalize,../reference/api/pandas.DatetimeIndex.normalize +generated/pandas.DatetimeIndex.quarter,../reference/api/pandas.DatetimeIndex.quarter +generated/pandas.DatetimeIndex.round,../reference/api/pandas.DatetimeIndex.round +generated/pandas.DatetimeIndex.second,../reference/api/pandas.DatetimeIndex.second +generated/pandas.DatetimeIndex.snap,../reference/api/pandas.DatetimeIndex.snap +generated/pandas.DatetimeIndex.strftime,../reference/api/pandas.DatetimeIndex.strftime +generated/pandas.DatetimeIndex.time,../reference/api/pandas.DatetimeIndex.time +generated/pandas.DatetimeIndex.timetz,../reference/api/pandas.DatetimeIndex.timetz +generated/pandas.DatetimeIndex.to_frame,../reference/api/pandas.DatetimeIndex.to_frame 
+generated/pandas.DatetimeIndex.to_perioddelta,../reference/api/pandas.DatetimeIndex.to_perioddelta +generated/pandas.DatetimeIndex.to_period,../reference/api/pandas.DatetimeIndex.to_period +generated/pandas.DatetimeIndex.to_pydatetime,../reference/api/pandas.DatetimeIndex.to_pydatetime +generated/pandas.DatetimeIndex.to_series,../reference/api/pandas.DatetimeIndex.to_series +generated/pandas.DatetimeIndex.tz_convert,../reference/api/pandas.DatetimeIndex.tz_convert +generated/pandas.DatetimeIndex.tz,../reference/api/pandas.DatetimeIndex.tz +generated/pandas.DatetimeIndex.tz_localize,../reference/api/pandas.DatetimeIndex.tz_localize +generated/pandas.DatetimeIndex.weekday,../reference/api/pandas.DatetimeIndex.weekday +generated/pandas.DatetimeIndex.week,../reference/api/pandas.DatetimeIndex.week +generated/pandas.DatetimeIndex.weekofyear,../reference/api/pandas.DatetimeIndex.weekofyear +generated/pandas.DatetimeIndex.year,../reference/api/pandas.DatetimeIndex.year +generated/pandas.DatetimeTZDtype.base,../reference/api/pandas.DatetimeTZDtype.base +generated/pandas.DatetimeTZDtype.construct_array_type,../reference/api/pandas.DatetimeTZDtype.construct_array_type +generated/pandas.DatetimeTZDtype.construct_from_string,../reference/api/pandas.DatetimeTZDtype.construct_from_string +generated/pandas.DatetimeTZDtype,../reference/api/pandas.DatetimeTZDtype +generated/pandas.DatetimeTZDtype.isbuiltin,../reference/api/pandas.DatetimeTZDtype.isbuiltin +generated/pandas.DatetimeTZDtype.is_dtype,../reference/api/pandas.DatetimeTZDtype.is_dtype +generated/pandas.DatetimeTZDtype.isnative,../reference/api/pandas.DatetimeTZDtype.isnative +generated/pandas.DatetimeTZDtype.itemsize,../reference/api/pandas.DatetimeTZDtype.itemsize +generated/pandas.DatetimeTZDtype.kind,../reference/api/pandas.DatetimeTZDtype.kind +generated/pandas.DatetimeTZDtype.name,../reference/api/pandas.DatetimeTZDtype.name +generated/pandas.DatetimeTZDtype.names,../reference/api/pandas.DatetimeTZDtype.names +generated/pandas.DatetimeTZDtype.na_value,../reference/api/pandas.DatetimeTZDtype.na_value +generated/pandas.DatetimeTZDtype.num,../reference/api/pandas.DatetimeTZDtype.num +generated/pandas.DatetimeTZDtype.reset_cache,../reference/api/pandas.DatetimeTZDtype.reset_cache +generated/pandas.DatetimeTZDtype.shape,../reference/api/pandas.DatetimeTZDtype.shape +generated/pandas.DatetimeTZDtype.str,../reference/api/pandas.DatetimeTZDtype.str +generated/pandas.DatetimeTZDtype.subdtype,../reference/api/pandas.DatetimeTZDtype.subdtype +generated/pandas.DatetimeTZDtype.tz,../reference/api/pandas.DatetimeTZDtype.tz +generated/pandas.DatetimeTZDtype.unit,../reference/api/pandas.DatetimeTZDtype.unit +generated/pandas.describe_option,../reference/api/pandas.describe_option +generated/pandas.errors.DtypeWarning,../reference/api/pandas.errors.DtypeWarning +generated/pandas.errors.EmptyDataError,../reference/api/pandas.errors.EmptyDataError +generated/pandas.errors.OutOfBoundsDatetime,../reference/api/pandas.errors.OutOfBoundsDatetime +generated/pandas.errors.ParserError,../reference/api/pandas.errors.ParserError +generated/pandas.errors.ParserWarning,../reference/api/pandas.errors.ParserWarning +generated/pandas.errors.PerformanceWarning,../reference/api/pandas.errors.PerformanceWarning +generated/pandas.errors.UnsortedIndexError,../reference/api/pandas.errors.UnsortedIndexError +generated/pandas.errors.UnsupportedFunctionCall,../reference/api/pandas.errors.UnsupportedFunctionCall +generated/pandas.eval,../reference/api/pandas.eval 
+generated/pandas.ExcelFile.parse,../reference/api/pandas.ExcelFile.parse +generated/pandas.ExcelWriter,../reference/api/pandas.ExcelWriter +generated/pandas.factorize,../reference/api/pandas.factorize +generated/pandas.Float64Index,../reference/api/pandas.Float64Index +generated/pandas.get_dummies,../reference/api/pandas.get_dummies +generated/pandas.get_option,../reference/api/pandas.get_option +generated/pandas.Grouper,../reference/api/pandas.Grouper +generated/pandas.HDFStore.append,../reference/api/pandas.HDFStore.append +generated/pandas.HDFStore.get,../reference/api/pandas.HDFStore.get +generated/pandas.HDFStore.groups,../reference/api/pandas.HDFStore.groups +generated/pandas.HDFStore.info,../reference/api/pandas.HDFStore.info +generated/pandas.HDFStore.keys,../reference/api/pandas.HDFStore.keys +generated/pandas.HDFStore.put,../reference/api/pandas.HDFStore.put +generated/pandas.HDFStore.select,../reference/api/pandas.HDFStore.select +generated/pandas.HDFStore.walk,../reference/api/pandas.HDFStore.walk +generated/pandas.Index.all,../reference/api/pandas.Index.all +generated/pandas.Index.any,../reference/api/pandas.Index.any +generated/pandas.Index.append,../reference/api/pandas.Index.append +generated/pandas.Index.argmax,../reference/api/pandas.Index.argmax +generated/pandas.Index.argmin,../reference/api/pandas.Index.argmin +generated/pandas.Index.argsort,../reference/api/pandas.Index.argsort +generated/pandas.Index.array,../reference/api/pandas.Index.array +generated/pandas.Index.asi8,../reference/api/pandas.Index.asi8 +generated/pandas.Index.asof,../reference/api/pandas.Index.asof +generated/pandas.Index.asof_locs,../reference/api/pandas.Index.asof_locs +generated/pandas.Index.astype,../reference/api/pandas.Index.astype +generated/pandas.Index.base,../reference/api/pandas.Index.base +generated/pandas.Index.contains,../reference/api/pandas.Index.contains +generated/pandas.Index.copy,../reference/api/pandas.Index.copy +generated/pandas.Index.data,../reference/api/pandas.Index.data +generated/pandas.Index.delete,../reference/api/pandas.Index.delete +generated/pandas.Index.difference,../reference/api/pandas.Index.difference +generated/pandas.Index.drop_duplicates,../reference/api/pandas.Index.drop_duplicates +generated/pandas.Index.drop,../reference/api/pandas.Index.drop +generated/pandas.Index.droplevel,../reference/api/pandas.Index.droplevel +generated/pandas.Index.dropna,../reference/api/pandas.Index.dropna +generated/pandas.Index.dtype,../reference/api/pandas.Index.dtype +generated/pandas.Index.dtype_str,../reference/api/pandas.Index.dtype_str +generated/pandas.Index.duplicated,../reference/api/pandas.Index.duplicated +generated/pandas.Index.empty,../reference/api/pandas.Index.empty +generated/pandas.Index.equals,../reference/api/pandas.Index.equals +generated/pandas.Index.factorize,../reference/api/pandas.Index.factorize +generated/pandas.Index.fillna,../reference/api/pandas.Index.fillna +generated/pandas.Index.flags,../reference/api/pandas.Index.flags +generated/pandas.Index.format,../reference/api/pandas.Index.format +generated/pandas.Index.get_duplicates,../reference/api/pandas.Index.get_duplicates +generated/pandas.Index.get_indexer_for,../reference/api/pandas.Index.get_indexer_for +generated/pandas.Index.get_indexer,../reference/api/pandas.Index.get_indexer +generated/pandas.Index.get_indexer_non_unique,../reference/api/pandas.Index.get_indexer_non_unique +generated/pandas.Index.get_level_values,../reference/api/pandas.Index.get_level_values 
+generated/pandas.Index.get_loc,../reference/api/pandas.Index.get_loc +generated/pandas.Index.get_slice_bound,../reference/api/pandas.Index.get_slice_bound +generated/pandas.Index.get_value,../reference/api/pandas.Index.get_value +generated/pandas.Index.get_values,../reference/api/pandas.Index.get_values +generated/pandas.Index.groupby,../reference/api/pandas.Index.groupby +generated/pandas.Index.has_duplicates,../reference/api/pandas.Index.has_duplicates +generated/pandas.Index.hasnans,../reference/api/pandas.Index.hasnans +generated/pandas.Index.holds_integer,../reference/api/pandas.Index.holds_integer +generated/pandas.Index,../reference/api/pandas.Index +generated/pandas.Index.identical,../reference/api/pandas.Index.identical +generated/pandas.Index.inferred_type,../reference/api/pandas.Index.inferred_type +generated/pandas.Index.insert,../reference/api/pandas.Index.insert +generated/pandas.Index.intersection,../reference/api/pandas.Index.intersection +generated/pandas.Index.is_all_dates,../reference/api/pandas.Index.is_all_dates +generated/pandas.Index.is_boolean,../reference/api/pandas.Index.is_boolean +generated/pandas.Index.is_categorical,../reference/api/pandas.Index.is_categorical +generated/pandas.Index.is_floating,../reference/api/pandas.Index.is_floating +generated/pandas.Index.is_,../reference/api/pandas.Index.is_ +generated/pandas.Index.isin,../reference/api/pandas.Index.isin +generated/pandas.Index.is_integer,../reference/api/pandas.Index.is_integer +generated/pandas.Index.is_interval,../reference/api/pandas.Index.is_interval +generated/pandas.Index.is_lexsorted_for_tuple,../reference/api/pandas.Index.is_lexsorted_for_tuple +generated/pandas.Index.is_mixed,../reference/api/pandas.Index.is_mixed +generated/pandas.Index.is_monotonic_decreasing,../reference/api/pandas.Index.is_monotonic_decreasing +generated/pandas.Index.is_monotonic,../reference/api/pandas.Index.is_monotonic +generated/pandas.Index.is_monotonic_increasing,../reference/api/pandas.Index.is_monotonic_increasing +generated/pandas.Index.isna,../reference/api/pandas.Index.isna +generated/pandas.Index.isnull,../reference/api/pandas.Index.isnull +generated/pandas.Index.is_numeric,../reference/api/pandas.Index.is_numeric +generated/pandas.Index.is_object,../reference/api/pandas.Index.is_object +generated/pandas.Index.is_type_compatible,../reference/api/pandas.Index.is_type_compatible +generated/pandas.Index.is_unique,../reference/api/pandas.Index.is_unique +generated/pandas.Index.item,../reference/api/pandas.Index.item +generated/pandas.Index.itemsize,../reference/api/pandas.Index.itemsize +generated/pandas.Index.join,../reference/api/pandas.Index.join +generated/pandas.Index.map,../reference/api/pandas.Index.map +generated/pandas.Index.max,../reference/api/pandas.Index.max +generated/pandas.Index.memory_usage,../reference/api/pandas.Index.memory_usage +generated/pandas.Index.min,../reference/api/pandas.Index.min +generated/pandas.Index.name,../reference/api/pandas.Index.name +generated/pandas.Index.names,../reference/api/pandas.Index.names +generated/pandas.Index.nbytes,../reference/api/pandas.Index.nbytes +generated/pandas.Index.ndim,../reference/api/pandas.Index.ndim +generated/pandas.Index.nlevels,../reference/api/pandas.Index.nlevels +generated/pandas.Index.notna,../reference/api/pandas.Index.notna +generated/pandas.Index.notnull,../reference/api/pandas.Index.notnull +generated/pandas.Index.nunique,../reference/api/pandas.Index.nunique +generated/pandas.Index.putmask,../reference/api/pandas.Index.putmask 
+generated/pandas.Index.ravel,../reference/api/pandas.Index.ravel +generated/pandas.Index.reindex,../reference/api/pandas.Index.reindex +generated/pandas.Index.rename,../reference/api/pandas.Index.rename +generated/pandas.Index.repeat,../reference/api/pandas.Index.repeat +generated/pandas.Index.searchsorted,../reference/api/pandas.Index.searchsorted +generated/pandas.Index.set_names,../reference/api/pandas.Index.set_names +generated/pandas.Index.set_value,../reference/api/pandas.Index.set_value +generated/pandas.Index.shape,../reference/api/pandas.Index.shape +generated/pandas.Index.shift,../reference/api/pandas.Index.shift +generated/pandas.Index.size,../reference/api/pandas.Index.size +generated/pandas.IndexSlice,../reference/api/pandas.IndexSlice +generated/pandas.Index.slice_indexer,../reference/api/pandas.Index.slice_indexer +generated/pandas.Index.slice_locs,../reference/api/pandas.Index.slice_locs +generated/pandas.Index.sort,../reference/api/pandas.Index.sort +generated/pandas.Index.sortlevel,../reference/api/pandas.Index.sortlevel +generated/pandas.Index.sort_values,../reference/api/pandas.Index.sort_values +generated/pandas.Index.str,../reference/api/pandas.Index.str +generated/pandas.Index.strides,../reference/api/pandas.Index.strides +generated/pandas.Index.summary,../reference/api/pandas.Index.summary +generated/pandas.Index.symmetric_difference,../reference/api/pandas.Index.symmetric_difference +generated/pandas.Index.take,../reference/api/pandas.Index.take +generated/pandas.Index.T,../reference/api/pandas.Index.T +generated/pandas.Index.to_flat_index,../reference/api/pandas.Index.to_flat_index +generated/pandas.Index.to_frame,../reference/api/pandas.Index.to_frame +generated/pandas.Index.to_list,../reference/api/pandas.Index.to_list +generated/pandas.Index.tolist,../reference/api/pandas.Index.tolist +generated/pandas.Index.to_native_types,../reference/api/pandas.Index.to_native_types +generated/pandas.Index.to_numpy,../reference/api/pandas.Index.to_numpy +generated/pandas.Index.to_series,../reference/api/pandas.Index.to_series +generated/pandas.Index.transpose,../reference/api/pandas.Index.transpose +generated/pandas.Index.union,../reference/api/pandas.Index.union +generated/pandas.Index.unique,../reference/api/pandas.Index.unique +generated/pandas.Index.value_counts,../reference/api/pandas.Index.value_counts +generated/pandas.Index.values,../reference/api/pandas.Index.values +generated/pandas.Index.view,../reference/api/pandas.Index.view +generated/pandas.Index.where,../reference/api/pandas.Index.where +generated/pandas.infer_freq,../reference/api/pandas.infer_freq +generated/pandas.Interval.closed,../reference/api/pandas.Interval.closed +generated/pandas.Interval.closed_left,../reference/api/pandas.Interval.closed_left +generated/pandas.Interval.closed_right,../reference/api/pandas.Interval.closed_right +generated/pandas.Interval,../reference/api/pandas.Interval +generated/pandas.IntervalIndex.closed,../reference/api/pandas.IntervalIndex.closed +generated/pandas.IntervalIndex.contains,../reference/api/pandas.IntervalIndex.contains +generated/pandas.IntervalIndex.from_arrays,../reference/api/pandas.IntervalIndex.from_arrays +generated/pandas.IntervalIndex.from_breaks,../reference/api/pandas.IntervalIndex.from_breaks +generated/pandas.IntervalIndex.from_tuples,../reference/api/pandas.IntervalIndex.from_tuples +generated/pandas.IntervalIndex.get_indexer,../reference/api/pandas.IntervalIndex.get_indexer 
+generated/pandas.IntervalIndex.get_loc,../reference/api/pandas.IntervalIndex.get_loc +generated/pandas.IntervalIndex,../reference/api/pandas.IntervalIndex +generated/pandas.IntervalIndex.is_non_overlapping_monotonic,../reference/api/pandas.IntervalIndex.is_non_overlapping_monotonic +generated/pandas.IntervalIndex.is_overlapping,../reference/api/pandas.IntervalIndex.is_overlapping +generated/pandas.IntervalIndex.left,../reference/api/pandas.IntervalIndex.left +generated/pandas.IntervalIndex.length,../reference/api/pandas.IntervalIndex.length +generated/pandas.IntervalIndex.mid,../reference/api/pandas.IntervalIndex.mid +generated/pandas.IntervalIndex.overlaps,../reference/api/pandas.IntervalIndex.overlaps +generated/pandas.IntervalIndex.right,../reference/api/pandas.IntervalIndex.right +generated/pandas.IntervalIndex.set_closed,../reference/api/pandas.IntervalIndex.set_closed +generated/pandas.IntervalIndex.to_tuples,../reference/api/pandas.IntervalIndex.to_tuples +generated/pandas.IntervalIndex.values,../reference/api/pandas.IntervalIndex.values +generated/pandas.Interval.left,../reference/api/pandas.Interval.left +generated/pandas.Interval.length,../reference/api/pandas.Interval.length +generated/pandas.Interval.mid,../reference/api/pandas.Interval.mid +generated/pandas.Interval.open_left,../reference/api/pandas.Interval.open_left +generated/pandas.Interval.open_right,../reference/api/pandas.Interval.open_right +generated/pandas.Interval.overlaps,../reference/api/pandas.Interval.overlaps +generated/pandas.interval_range,../reference/api/pandas.interval_range +generated/pandas.Interval.right,../reference/api/pandas.Interval.right +generated/pandas.io.formats.style.Styler.apply,../reference/api/pandas.io.formats.style.Styler.apply +generated/pandas.io.formats.style.Styler.applymap,../reference/api/pandas.io.formats.style.Styler.applymap +generated/pandas.io.formats.style.Styler.background_gradient,../reference/api/pandas.io.formats.style.Styler.background_gradient +generated/pandas.io.formats.style.Styler.bar,../reference/api/pandas.io.formats.style.Styler.bar +generated/pandas.io.formats.style.Styler.clear,../reference/api/pandas.io.formats.style.Styler.clear +generated/pandas.io.formats.style.Styler.env,../reference/api/pandas.io.formats.style.Styler.env +generated/pandas.io.formats.style.Styler.export,../reference/api/pandas.io.formats.style.Styler.export +generated/pandas.io.formats.style.Styler.format,../reference/api/pandas.io.formats.style.Styler.format +generated/pandas.io.formats.style.Styler.from_custom_template,../reference/api/pandas.io.formats.style.Styler.from_custom_template +generated/pandas.io.formats.style.Styler.hide_columns,../reference/api/pandas.io.formats.style.Styler.hide_columns +generated/pandas.io.formats.style.Styler.hide_index,../reference/api/pandas.io.formats.style.Styler.hide_index +generated/pandas.io.formats.style.Styler.highlight_max,../reference/api/pandas.io.formats.style.Styler.highlight_max +generated/pandas.io.formats.style.Styler.highlight_min,../reference/api/pandas.io.formats.style.Styler.highlight_min +generated/pandas.io.formats.style.Styler.highlight_null,../reference/api/pandas.io.formats.style.Styler.highlight_null +generated/pandas.io.formats.style.Styler,../reference/api/pandas.io.formats.style.Styler +generated/pandas.io.formats.style.Styler.loader,../reference/api/pandas.io.formats.style.Styler.loader +generated/pandas.io.formats.style.Styler.pipe,../reference/api/pandas.io.formats.style.Styler.pipe 
+generated/pandas.io.formats.style.Styler.render,../reference/api/pandas.io.formats.style.Styler.render +generated/pandas.io.formats.style.Styler.set_caption,../reference/api/pandas.io.formats.style.Styler.set_caption +generated/pandas.io.formats.style.Styler.set_precision,../reference/api/pandas.io.formats.style.Styler.set_precision +generated/pandas.io.formats.style.Styler.set_properties,../reference/api/pandas.io.formats.style.Styler.set_properties +generated/pandas.io.formats.style.Styler.set_table_attributes,../reference/api/pandas.io.formats.style.Styler.set_table_attributes +generated/pandas.io.formats.style.Styler.set_table_styles,../reference/api/pandas.io.formats.style.Styler.set_table_styles +generated/pandas.io.formats.style.Styler.set_uuid,../reference/api/pandas.io.formats.style.Styler.set_uuid +generated/pandas.io.formats.style.Styler.template,../reference/api/pandas.io.formats.style.Styler.template +generated/pandas.io.formats.style.Styler.to_excel,../reference/api/pandas.io.formats.style.Styler.to_excel +generated/pandas.io.formats.style.Styler.use,../reference/api/pandas.io.formats.style.Styler.use +generated/pandas.io.formats.style.Styler.where,../reference/api/pandas.io.formats.style.Styler.where +generated/pandas.io.json.build_table_schema,../reference/api/pandas.io.json.build_table_schema +generated/pandas.io.json.json_normalize,../reference/api/pandas.io.json.json_normalize +generated/pandas.io.stata.StataReader.data,../reference/api/pandas.io.stata.StataReader.data +generated/pandas.io.stata.StataReader.data_label,../reference/api/pandas.io.stata.StataReader.data_label +generated/pandas.io.stata.StataReader.value_labels,../reference/api/pandas.io.stata.StataReader.value_labels +generated/pandas.io.stata.StataReader.variable_labels,../reference/api/pandas.io.stata.StataReader.variable_labels +generated/pandas.io.stata.StataWriter.write_file,../reference/api/pandas.io.stata.StataWriter.write_file +generated/pandas.isna,../reference/api/pandas.isna +generated/pandas.isnull,../reference/api/pandas.isnull +generated/pandas.melt,../reference/api/pandas.melt +generated/pandas.merge_asof,../reference/api/pandas.merge_asof +generated/pandas.merge,../reference/api/pandas.merge +generated/pandas.merge_ordered,../reference/api/pandas.merge_ordered +generated/pandas.MultiIndex.codes,../reference/api/pandas.MultiIndex.codes +generated/pandas.MultiIndex.droplevel,../reference/api/pandas.MultiIndex.droplevel +generated/pandas.MultiIndex.from_arrays,../reference/api/pandas.MultiIndex.from_arrays +generated/pandas.MultiIndex.from_frame,../reference/api/pandas.MultiIndex.from_frame +generated/pandas.MultiIndex.from_product,../reference/api/pandas.MultiIndex.from_product +generated/pandas.MultiIndex.from_tuples,../reference/api/pandas.MultiIndex.from_tuples +generated/pandas.MultiIndex.get_indexer,../reference/api/pandas.MultiIndex.get_indexer +generated/pandas.MultiIndex.get_level_values,../reference/api/pandas.MultiIndex.get_level_values +generated/pandas.MultiIndex.get_loc,../reference/api/pandas.MultiIndex.get_loc +generated/pandas.MultiIndex.get_loc_level,../reference/api/pandas.MultiIndex.get_loc_level +generated/pandas.MultiIndex,../reference/api/pandas.MultiIndex +generated/pandas.MultiIndex.is_lexsorted,../reference/api/pandas.MultiIndex.is_lexsorted +generated/pandas.MultiIndex.levels,../reference/api/pandas.MultiIndex.levels +generated/pandas.MultiIndex.levshape,../reference/api/pandas.MultiIndex.levshape 
+generated/pandas.MultiIndex.names,../reference/api/pandas.MultiIndex.names +generated/pandas.MultiIndex.nlevels,../reference/api/pandas.MultiIndex.nlevels +generated/pandas.MultiIndex.remove_unused_levels,../reference/api/pandas.MultiIndex.remove_unused_levels +generated/pandas.MultiIndex.reorder_levels,../reference/api/pandas.MultiIndex.reorder_levels +generated/pandas.MultiIndex.set_codes,../reference/api/pandas.MultiIndex.set_codes +generated/pandas.MultiIndex.set_levels,../reference/api/pandas.MultiIndex.set_levels +generated/pandas.MultiIndex.sortlevel,../reference/api/pandas.MultiIndex.sortlevel +generated/pandas.MultiIndex.swaplevel,../reference/api/pandas.MultiIndex.swaplevel +generated/pandas.MultiIndex.to_flat_index,../reference/api/pandas.MultiIndex.to_flat_index +generated/pandas.MultiIndex.to_frame,../reference/api/pandas.MultiIndex.to_frame +generated/pandas.MultiIndex.to_hierarchical,../reference/api/pandas.MultiIndex.to_hierarchical +generated/pandas.notna,../reference/api/pandas.notna +generated/pandas.notnull,../reference/api/pandas.notnull +generated/pandas.option_context,../reference/api/pandas.option_context +generated/pandas.Panel.abs,../reference/api/pandas.Panel.abs +generated/pandas.Panel.add,../reference/api/pandas.Panel.add +generated/pandas.Panel.add_prefix,../reference/api/pandas.Panel.add_prefix +generated/pandas.Panel.add_suffix,../reference/api/pandas.Panel.add_suffix +generated/pandas.Panel.agg,../reference/api/pandas.Panel.agg +generated/pandas.Panel.aggregate,../reference/api/pandas.Panel.aggregate +generated/pandas.Panel.align,../reference/api/pandas.Panel.align +generated/pandas.Panel.all,../reference/api/pandas.Panel.all +generated/pandas.Panel.any,../reference/api/pandas.Panel.any +generated/pandas.Panel.apply,../reference/api/pandas.Panel.apply +generated/pandas.Panel.as_blocks,../reference/api/pandas.Panel.as_blocks +generated/pandas.Panel.asfreq,../reference/api/pandas.Panel.asfreq +generated/pandas.Panel.as_matrix,../reference/api/pandas.Panel.as_matrix +generated/pandas.Panel.asof,../reference/api/pandas.Panel.asof +generated/pandas.Panel.astype,../reference/api/pandas.Panel.astype +generated/pandas.Panel.at,../reference/api/pandas.Panel.at +generated/pandas.Panel.at_time,../reference/api/pandas.Panel.at_time +generated/pandas.Panel.axes,../reference/api/pandas.Panel.axes +generated/pandas.Panel.between_time,../reference/api/pandas.Panel.between_time +generated/pandas.Panel.bfill,../reference/api/pandas.Panel.bfill +generated/pandas.Panel.blocks,../reference/api/pandas.Panel.blocks +generated/pandas.Panel.bool,../reference/api/pandas.Panel.bool +generated/pandas.Panel.clip,../reference/api/pandas.Panel.clip +generated/pandas.Panel.clip_lower,../reference/api/pandas.Panel.clip_lower +generated/pandas.Panel.clip_upper,../reference/api/pandas.Panel.clip_upper +generated/pandas.Panel.compound,../reference/api/pandas.Panel.compound +generated/pandas.Panel.conform,../reference/api/pandas.Panel.conform +generated/pandas.Panel.convert_objects,../reference/api/pandas.Panel.convert_objects +generated/pandas.Panel.copy,../reference/api/pandas.Panel.copy +generated/pandas.Panel.count,../reference/api/pandas.Panel.count +generated/pandas.Panel.cummax,../reference/api/pandas.Panel.cummax +generated/pandas.Panel.cummin,../reference/api/pandas.Panel.cummin +generated/pandas.Panel.cumprod,../reference/api/pandas.Panel.cumprod +generated/pandas.Panel.cumsum,../reference/api/pandas.Panel.cumsum 
+generated/pandas.Panel.describe,../reference/api/pandas.Panel.describe +generated/pandas.Panel.div,../reference/api/pandas.Panel.div +generated/pandas.Panel.divide,../reference/api/pandas.Panel.divide +generated/pandas.Panel.drop,../reference/api/pandas.Panel.drop +generated/pandas.Panel.droplevel,../reference/api/pandas.Panel.droplevel +generated/pandas.Panel.dropna,../reference/api/pandas.Panel.dropna +generated/pandas.Panel.dtypes,../reference/api/pandas.Panel.dtypes +generated/pandas.Panel.empty,../reference/api/pandas.Panel.empty +generated/pandas.Panel.eq,../reference/api/pandas.Panel.eq +generated/pandas.Panel.equals,../reference/api/pandas.Panel.equals +generated/pandas.Panel.ffill,../reference/api/pandas.Panel.ffill +generated/pandas.Panel.fillna,../reference/api/pandas.Panel.fillna +generated/pandas.Panel.filter,../reference/api/pandas.Panel.filter +generated/pandas.Panel.first,../reference/api/pandas.Panel.first +generated/pandas.Panel.first_valid_index,../reference/api/pandas.Panel.first_valid_index +generated/pandas.Panel.floordiv,../reference/api/pandas.Panel.floordiv +generated/pandas.Panel.from_dict,../reference/api/pandas.Panel.from_dict +generated/pandas.Panel.fromDict,../reference/api/pandas.Panel.fromDict +generated/pandas.Panel.ftypes,../reference/api/pandas.Panel.ftypes +generated/pandas.Panel.ge,../reference/api/pandas.Panel.ge +generated/pandas.Panel.get_dtype_counts,../reference/api/pandas.Panel.get_dtype_counts +generated/pandas.Panel.get_ftype_counts,../reference/api/pandas.Panel.get_ftype_counts +generated/pandas.Panel.get,../reference/api/pandas.Panel.get +generated/pandas.Panel.get_value,../reference/api/pandas.Panel.get_value +generated/pandas.Panel.get_values,../reference/api/pandas.Panel.get_values +generated/pandas.Panel.groupby,../reference/api/pandas.Panel.groupby +generated/pandas.Panel.gt,../reference/api/pandas.Panel.gt +generated/pandas.Panel.head,../reference/api/pandas.Panel.head +generated/pandas.Panel,../reference/api/pandas.Panel +generated/pandas.Panel.iat,../reference/api/pandas.Panel.iat +generated/pandas.Panel.iloc,../reference/api/pandas.Panel.iloc +generated/pandas.Panel.infer_objects,../reference/api/pandas.Panel.infer_objects +generated/pandas.Panel.interpolate,../reference/api/pandas.Panel.interpolate +generated/pandas.Panel.is_copy,../reference/api/pandas.Panel.is_copy +generated/pandas.Panel.isna,../reference/api/pandas.Panel.isna +generated/pandas.Panel.isnull,../reference/api/pandas.Panel.isnull +generated/pandas.Panel.items,../reference/api/pandas.Panel.items +generated/pandas.Panel.__iter__,../reference/api/pandas.Panel.__iter__ +generated/pandas.Panel.iteritems,../reference/api/pandas.Panel.iteritems +generated/pandas.Panel.ix,../reference/api/pandas.Panel.ix +generated/pandas.Panel.join,../reference/api/pandas.Panel.join +generated/pandas.Panel.keys,../reference/api/pandas.Panel.keys +generated/pandas.Panel.kurt,../reference/api/pandas.Panel.kurt +generated/pandas.Panel.kurtosis,../reference/api/pandas.Panel.kurtosis +generated/pandas.Panel.last,../reference/api/pandas.Panel.last +generated/pandas.Panel.last_valid_index,../reference/api/pandas.Panel.last_valid_index +generated/pandas.Panel.le,../reference/api/pandas.Panel.le +generated/pandas.Panel.loc,../reference/api/pandas.Panel.loc +generated/pandas.Panel.lt,../reference/api/pandas.Panel.lt +generated/pandas.Panel.mad,../reference/api/pandas.Panel.mad +generated/pandas.Panel.major_axis,../reference/api/pandas.Panel.major_axis 
+generated/pandas.Panel.major_xs,../reference/api/pandas.Panel.major_xs +generated/pandas.Panel.mask,../reference/api/pandas.Panel.mask +generated/pandas.Panel.max,../reference/api/pandas.Panel.max +generated/pandas.Panel.mean,../reference/api/pandas.Panel.mean +generated/pandas.Panel.median,../reference/api/pandas.Panel.median +generated/pandas.Panel.min,../reference/api/pandas.Panel.min +generated/pandas.Panel.minor_axis,../reference/api/pandas.Panel.minor_axis +generated/pandas.Panel.minor_xs,../reference/api/pandas.Panel.minor_xs +generated/pandas.Panel.mod,../reference/api/pandas.Panel.mod +generated/pandas.Panel.mul,../reference/api/pandas.Panel.mul +generated/pandas.Panel.multiply,../reference/api/pandas.Panel.multiply +generated/pandas.Panel.ndim,../reference/api/pandas.Panel.ndim +generated/pandas.Panel.ne,../reference/api/pandas.Panel.ne +generated/pandas.Panel.notna,../reference/api/pandas.Panel.notna +generated/pandas.Panel.notnull,../reference/api/pandas.Panel.notnull +generated/pandas.Panel.pct_change,../reference/api/pandas.Panel.pct_change +generated/pandas.Panel.pipe,../reference/api/pandas.Panel.pipe +generated/pandas.Panel.pop,../reference/api/pandas.Panel.pop +generated/pandas.Panel.pow,../reference/api/pandas.Panel.pow +generated/pandas.Panel.prod,../reference/api/pandas.Panel.prod +generated/pandas.Panel.product,../reference/api/pandas.Panel.product +generated/pandas.Panel.radd,../reference/api/pandas.Panel.radd +generated/pandas.Panel.rank,../reference/api/pandas.Panel.rank +generated/pandas.Panel.rdiv,../reference/api/pandas.Panel.rdiv +generated/pandas.Panel.reindex_axis,../reference/api/pandas.Panel.reindex_axis +generated/pandas.Panel.reindex,../reference/api/pandas.Panel.reindex +generated/pandas.Panel.reindex_like,../reference/api/pandas.Panel.reindex_like +generated/pandas.Panel.rename_axis,../reference/api/pandas.Panel.rename_axis +generated/pandas.Panel.rename,../reference/api/pandas.Panel.rename +generated/pandas.Panel.replace,../reference/api/pandas.Panel.replace +generated/pandas.Panel.resample,../reference/api/pandas.Panel.resample +generated/pandas.Panel.rfloordiv,../reference/api/pandas.Panel.rfloordiv +generated/pandas.Panel.rmod,../reference/api/pandas.Panel.rmod +generated/pandas.Panel.rmul,../reference/api/pandas.Panel.rmul +generated/pandas.Panel.round,../reference/api/pandas.Panel.round +generated/pandas.Panel.rpow,../reference/api/pandas.Panel.rpow +generated/pandas.Panel.rsub,../reference/api/pandas.Panel.rsub +generated/pandas.Panel.rtruediv,../reference/api/pandas.Panel.rtruediv +generated/pandas.Panel.sample,../reference/api/pandas.Panel.sample +generated/pandas.Panel.select,../reference/api/pandas.Panel.select +generated/pandas.Panel.sem,../reference/api/pandas.Panel.sem +generated/pandas.Panel.set_axis,../reference/api/pandas.Panel.set_axis +generated/pandas.Panel.set_value,../reference/api/pandas.Panel.set_value +generated/pandas.Panel.shape,../reference/api/pandas.Panel.shape +generated/pandas.Panel.shift,../reference/api/pandas.Panel.shift +generated/pandas.Panel.size,../reference/api/pandas.Panel.size +generated/pandas.Panel.skew,../reference/api/pandas.Panel.skew +generated/pandas.Panel.slice_shift,../reference/api/pandas.Panel.slice_shift +generated/pandas.Panel.sort_index,../reference/api/pandas.Panel.sort_index +generated/pandas.Panel.sort_values,../reference/api/pandas.Panel.sort_values +generated/pandas.Panel.squeeze,../reference/api/pandas.Panel.squeeze +generated/pandas.Panel.std,../reference/api/pandas.Panel.std 
+generated/pandas.Panel.sub,../reference/api/pandas.Panel.sub +generated/pandas.Panel.subtract,../reference/api/pandas.Panel.subtract +generated/pandas.Panel.sum,../reference/api/pandas.Panel.sum +generated/pandas.Panel.swapaxes,../reference/api/pandas.Panel.swapaxes +generated/pandas.Panel.swaplevel,../reference/api/pandas.Panel.swaplevel +generated/pandas.Panel.tail,../reference/api/pandas.Panel.tail +generated/pandas.Panel.take,../reference/api/pandas.Panel.take +generated/pandas.Panel.timetuple,../reference/api/pandas.Panel.timetuple +generated/pandas.Panel.to_clipboard,../reference/api/pandas.Panel.to_clipboard +generated/pandas.Panel.to_csv,../reference/api/pandas.Panel.to_csv +generated/pandas.Panel.to_dense,../reference/api/pandas.Panel.to_dense +generated/pandas.Panel.to_excel,../reference/api/pandas.Panel.to_excel +generated/pandas.Panel.to_frame,../reference/api/pandas.Panel.to_frame +generated/pandas.Panel.to_hdf,../reference/api/pandas.Panel.to_hdf +generated/pandas.Panel.to_json,../reference/api/pandas.Panel.to_json +generated/pandas.Panel.to_latex,../reference/api/pandas.Panel.to_latex +generated/pandas.Panel.to_msgpack,../reference/api/pandas.Panel.to_msgpack +generated/pandas.Panel.to_pickle,../reference/api/pandas.Panel.to_pickle +generated/pandas.Panel.to_sparse,../reference/api/pandas.Panel.to_sparse +generated/pandas.Panel.to_sql,../reference/api/pandas.Panel.to_sql +generated/pandas.Panel.to_xarray,../reference/api/pandas.Panel.to_xarray +generated/pandas.Panel.transform,../reference/api/pandas.Panel.transform +generated/pandas.Panel.transpose,../reference/api/pandas.Panel.transpose +generated/pandas.Panel.truediv,../reference/api/pandas.Panel.truediv +generated/pandas.Panel.truncate,../reference/api/pandas.Panel.truncate +generated/pandas.Panel.tshift,../reference/api/pandas.Panel.tshift +generated/pandas.Panel.tz_convert,../reference/api/pandas.Panel.tz_convert +generated/pandas.Panel.tz_localize,../reference/api/pandas.Panel.tz_localize +generated/pandas.Panel.update,../reference/api/pandas.Panel.update +generated/pandas.Panel.values,../reference/api/pandas.Panel.values +generated/pandas.Panel.var,../reference/api/pandas.Panel.var +generated/pandas.Panel.where,../reference/api/pandas.Panel.where +generated/pandas.Panel.xs,../reference/api/pandas.Panel.xs +generated/pandas.Period.asfreq,../reference/api/pandas.Period.asfreq +generated/pandas.Period.day,../reference/api/pandas.Period.day +generated/pandas.Period.dayofweek,../reference/api/pandas.Period.dayofweek +generated/pandas.Period.dayofyear,../reference/api/pandas.Period.dayofyear +generated/pandas.Period.days_in_month,../reference/api/pandas.Period.days_in_month +generated/pandas.Period.daysinmonth,../reference/api/pandas.Period.daysinmonth +generated/pandas.Period.end_time,../reference/api/pandas.Period.end_time +generated/pandas.Period.freq,../reference/api/pandas.Period.freq +generated/pandas.Period.freqstr,../reference/api/pandas.Period.freqstr +generated/pandas.Period.hour,../reference/api/pandas.Period.hour +generated/pandas.Period,../reference/api/pandas.Period +generated/pandas.PeriodIndex.asfreq,../reference/api/pandas.PeriodIndex.asfreq +generated/pandas.PeriodIndex.day,../reference/api/pandas.PeriodIndex.day +generated/pandas.PeriodIndex.dayofweek,../reference/api/pandas.PeriodIndex.dayofweek +generated/pandas.PeriodIndex.dayofyear,../reference/api/pandas.PeriodIndex.dayofyear +generated/pandas.PeriodIndex.days_in_month,../reference/api/pandas.PeriodIndex.days_in_month 
+generated/pandas.PeriodIndex.daysinmonth,../reference/api/pandas.PeriodIndex.daysinmonth +generated/pandas.PeriodIndex.end_time,../reference/api/pandas.PeriodIndex.end_time +generated/pandas.PeriodIndex.freq,../reference/api/pandas.PeriodIndex.freq +generated/pandas.PeriodIndex.freqstr,../reference/api/pandas.PeriodIndex.freqstr +generated/pandas.PeriodIndex.hour,../reference/api/pandas.PeriodIndex.hour +generated/pandas.PeriodIndex,../reference/api/pandas.PeriodIndex +generated/pandas.PeriodIndex.is_leap_year,../reference/api/pandas.PeriodIndex.is_leap_year +generated/pandas.PeriodIndex.minute,../reference/api/pandas.PeriodIndex.minute +generated/pandas.PeriodIndex.month,../reference/api/pandas.PeriodIndex.month +generated/pandas.PeriodIndex.quarter,../reference/api/pandas.PeriodIndex.quarter +generated/pandas.PeriodIndex.qyear,../reference/api/pandas.PeriodIndex.qyear +generated/pandas.PeriodIndex.second,../reference/api/pandas.PeriodIndex.second +generated/pandas.PeriodIndex.start_time,../reference/api/pandas.PeriodIndex.start_time +generated/pandas.PeriodIndex.strftime,../reference/api/pandas.PeriodIndex.strftime +generated/pandas.PeriodIndex.to_timestamp,../reference/api/pandas.PeriodIndex.to_timestamp +generated/pandas.PeriodIndex.weekday,../reference/api/pandas.PeriodIndex.weekday +generated/pandas.PeriodIndex.week,../reference/api/pandas.PeriodIndex.week +generated/pandas.PeriodIndex.weekofyear,../reference/api/pandas.PeriodIndex.weekofyear +generated/pandas.PeriodIndex.year,../reference/api/pandas.PeriodIndex.year +generated/pandas.Period.is_leap_year,../reference/api/pandas.Period.is_leap_year +generated/pandas.Period.minute,../reference/api/pandas.Period.minute +generated/pandas.Period.month,../reference/api/pandas.Period.month +generated/pandas.Period.now,../reference/api/pandas.Period.now +generated/pandas.Period.ordinal,../reference/api/pandas.Period.ordinal +generated/pandas.Period.quarter,../reference/api/pandas.Period.quarter +generated/pandas.Period.qyear,../reference/api/pandas.Period.qyear +generated/pandas.period_range,../reference/api/pandas.period_range +generated/pandas.Period.second,../reference/api/pandas.Period.second +generated/pandas.Period.start_time,../reference/api/pandas.Period.start_time +generated/pandas.Period.strftime,../reference/api/pandas.Period.strftime +generated/pandas.Period.to_timestamp,../reference/api/pandas.Period.to_timestamp +generated/pandas.Period.weekday,../reference/api/pandas.Period.weekday +generated/pandas.Period.week,../reference/api/pandas.Period.week +generated/pandas.Period.weekofyear,../reference/api/pandas.Period.weekofyear +generated/pandas.Period.year,../reference/api/pandas.Period.year +generated/pandas.pivot,../reference/api/pandas.pivot +generated/pandas.pivot_table,../reference/api/pandas.pivot_table +generated/pandas.plotting.andrews_curves,../reference/api/pandas.plotting.andrews_curves +generated/pandas.plotting.bootstrap_plot,../reference/api/pandas.plotting.bootstrap_plot +generated/pandas.plotting.deregister_matplotlib_converters,../reference/api/pandas.plotting.deregister_matplotlib_converters +generated/pandas.plotting.lag_plot,../reference/api/pandas.plotting.lag_plot +generated/pandas.plotting.parallel_coordinates,../reference/api/pandas.plotting.parallel_coordinates +generated/pandas.plotting.radviz,../reference/api/pandas.plotting.radviz +generated/pandas.plotting.register_matplotlib_converters,../reference/api/pandas.plotting.register_matplotlib_converters 
+generated/pandas.plotting.scatter_matrix,../reference/api/pandas.plotting.scatter_matrix +generated/pandas.qcut,../reference/api/pandas.qcut +generated/pandas.RangeIndex.from_range,../reference/api/pandas.RangeIndex.from_range +generated/pandas.RangeIndex,../reference/api/pandas.RangeIndex +generated/pandas.read_clipboard,../reference/api/pandas.read_clipboard +generated/pandas.read_csv,../reference/api/pandas.read_csv +generated/pandas.read_excel,../reference/api/pandas.read_excel +generated/pandas.read_feather,../reference/api/pandas.read_feather +generated/pandas.read_fwf,../reference/api/pandas.read_fwf +generated/pandas.read_gbq,../reference/api/pandas.read_gbq +generated/pandas.read_hdf,../reference/api/pandas.read_hdf +generated/pandas.read,../reference/api/pandas.read +generated/pandas.read_json,../reference/api/pandas.read_json +generated/pandas.read_msgpack,../reference/api/pandas.read_msgpack +generated/pandas.read_parquet,../reference/api/pandas.read_parquet +generated/pandas.read_pickle,../reference/api/pandas.read_pickle +generated/pandas.read_sas,../reference/api/pandas.read_sas +generated/pandas.read_sql,../reference/api/pandas.read_sql +generated/pandas.read_sql_query,../reference/api/pandas.read_sql_query +generated/pandas.read_sql_table,../reference/api/pandas.read_sql_table +generated/pandas.read_stata,../reference/api/pandas.read_stata +generated/pandas.read_table,../reference/api/pandas.read_table +generated/pandas.reset_option,../reference/api/pandas.reset_option +generated/pandas.Series.abs,../reference/api/pandas.Series.abs +generated/pandas.Series.add,../reference/api/pandas.Series.add +generated/pandas.Series.add_prefix,../reference/api/pandas.Series.add_prefix +generated/pandas.Series.add_suffix,../reference/api/pandas.Series.add_suffix +generated/pandas.Series.agg,../reference/api/pandas.Series.agg +generated/pandas.Series.aggregate,../reference/api/pandas.Series.aggregate +generated/pandas.Series.align,../reference/api/pandas.Series.align +generated/pandas.Series.all,../reference/api/pandas.Series.all +generated/pandas.Series.any,../reference/api/pandas.Series.any +generated/pandas.Series.append,../reference/api/pandas.Series.append +generated/pandas.Series.apply,../reference/api/pandas.Series.apply +generated/pandas.Series.argmax,../reference/api/pandas.Series.argmax +generated/pandas.Series.argmin,../reference/api/pandas.Series.argmin +generated/pandas.Series.argsort,../reference/api/pandas.Series.argsort +generated/pandas.Series.__array__,../reference/api/pandas.Series.__array__ +generated/pandas.Series.array,../reference/api/pandas.Series.array +generated/pandas.Series.as_blocks,../reference/api/pandas.Series.as_blocks +generated/pandas.Series.asfreq,../reference/api/pandas.Series.asfreq +generated/pandas.Series.as_matrix,../reference/api/pandas.Series.as_matrix +generated/pandas.Series.asobject,../reference/api/pandas.Series.asobject +generated/pandas.Series.asof,../reference/api/pandas.Series.asof +generated/pandas.Series.astype,../reference/api/pandas.Series.astype +generated/pandas.Series.at,../reference/api/pandas.Series.at +generated/pandas.Series.at_time,../reference/api/pandas.Series.at_time +generated/pandas.Series.autocorr,../reference/api/pandas.Series.autocorr +generated/pandas.Series.axes,../reference/api/pandas.Series.axes +generated/pandas.Series.base,../reference/api/pandas.Series.base +generated/pandas.Series.between,../reference/api/pandas.Series.between +generated/pandas.Series.between_time,../reference/api/pandas.Series.between_time 
+generated/pandas.Series.bfill,../reference/api/pandas.Series.bfill +generated/pandas.Series.blocks,../reference/api/pandas.Series.blocks +generated/pandas.Series.bool,../reference/api/pandas.Series.bool +generated/pandas.Series.cat.add_categories,../reference/api/pandas.Series.cat.add_categories +generated/pandas.Series.cat.as_ordered,../reference/api/pandas.Series.cat.as_ordered +generated/pandas.Series.cat.as_unordered,../reference/api/pandas.Series.cat.as_unordered +generated/pandas.Series.cat.categories,../reference/api/pandas.Series.cat.categories +generated/pandas.Series.cat.codes,../reference/api/pandas.Series.cat.codes +generated/pandas.Series.cat,../reference/api/pandas.Series.cat +generated/pandas.Series.cat.ordered,../reference/api/pandas.Series.cat.ordered +generated/pandas.Series.cat.remove_categories,../reference/api/pandas.Series.cat.remove_categories +generated/pandas.Series.cat.remove_unused_categories,../reference/api/pandas.Series.cat.remove_unused_categories +generated/pandas.Series.cat.rename_categories,../reference/api/pandas.Series.cat.rename_categories +generated/pandas.Series.cat.reorder_categories,../reference/api/pandas.Series.cat.reorder_categories +generated/pandas.Series.cat.set_categories,../reference/api/pandas.Series.cat.set_categories +generated/pandas.Series.clip,../reference/api/pandas.Series.clip +generated/pandas.Series.clip_lower,../reference/api/pandas.Series.clip_lower +generated/pandas.Series.clip_upper,../reference/api/pandas.Series.clip_upper +generated/pandas.Series.combine_first,../reference/api/pandas.Series.combine_first +generated/pandas.Series.combine,../reference/api/pandas.Series.combine +generated/pandas.Series.compound,../reference/api/pandas.Series.compound +generated/pandas.Series.compress,../reference/api/pandas.Series.compress +generated/pandas.Series.convert_objects,../reference/api/pandas.Series.convert_objects +generated/pandas.Series.copy,../reference/api/pandas.Series.copy +generated/pandas.Series.corr,../reference/api/pandas.Series.corr +generated/pandas.Series.count,../reference/api/pandas.Series.count +generated/pandas.Series.cov,../reference/api/pandas.Series.cov +generated/pandas.Series.cummax,../reference/api/pandas.Series.cummax +generated/pandas.Series.cummin,../reference/api/pandas.Series.cummin +generated/pandas.Series.cumprod,../reference/api/pandas.Series.cumprod +generated/pandas.Series.cumsum,../reference/api/pandas.Series.cumsum +generated/pandas.Series.data,../reference/api/pandas.Series.data +generated/pandas.Series.describe,../reference/api/pandas.Series.describe +generated/pandas.Series.diff,../reference/api/pandas.Series.diff +generated/pandas.Series.div,../reference/api/pandas.Series.div +generated/pandas.Series.divide,../reference/api/pandas.Series.divide +generated/pandas.Series.divmod,../reference/api/pandas.Series.divmod +generated/pandas.Series.dot,../reference/api/pandas.Series.dot +generated/pandas.Series.drop_duplicates,../reference/api/pandas.Series.drop_duplicates +generated/pandas.Series.drop,../reference/api/pandas.Series.drop +generated/pandas.Series.droplevel,../reference/api/pandas.Series.droplevel +generated/pandas.Series.dropna,../reference/api/pandas.Series.dropna +generated/pandas.Series.dt.ceil,../reference/api/pandas.Series.dt.ceil +generated/pandas.Series.dt.components,../reference/api/pandas.Series.dt.components +generated/pandas.Series.dt.date,../reference/api/pandas.Series.dt.date +generated/pandas.Series.dt.day,../reference/api/pandas.Series.dt.day 
+generated/pandas.Series.dt.day_name,../reference/api/pandas.Series.dt.day_name +generated/pandas.Series.dt.dayofweek,../reference/api/pandas.Series.dt.dayofweek +generated/pandas.Series.dt.dayofyear,../reference/api/pandas.Series.dt.dayofyear +generated/pandas.Series.dt.days,../reference/api/pandas.Series.dt.days +generated/pandas.Series.dt.days_in_month,../reference/api/pandas.Series.dt.days_in_month +generated/pandas.Series.dt.daysinmonth,../reference/api/pandas.Series.dt.daysinmonth +generated/pandas.Series.dt.end_time,../reference/api/pandas.Series.dt.end_time +generated/pandas.Series.dt.floor,../reference/api/pandas.Series.dt.floor +generated/pandas.Series.dt.freq,../reference/api/pandas.Series.dt.freq +generated/pandas.Series.dt.hour,../reference/api/pandas.Series.dt.hour +generated/pandas.Series.dt,../reference/api/pandas.Series.dt +generated/pandas.Series.dt.is_leap_year,../reference/api/pandas.Series.dt.is_leap_year +generated/pandas.Series.dt.is_month_end,../reference/api/pandas.Series.dt.is_month_end +generated/pandas.Series.dt.is_month_start,../reference/api/pandas.Series.dt.is_month_start +generated/pandas.Series.dt.is_quarter_end,../reference/api/pandas.Series.dt.is_quarter_end +generated/pandas.Series.dt.is_quarter_start,../reference/api/pandas.Series.dt.is_quarter_start +generated/pandas.Series.dt.is_year_end,../reference/api/pandas.Series.dt.is_year_end +generated/pandas.Series.dt.is_year_start,../reference/api/pandas.Series.dt.is_year_start +generated/pandas.Series.dt.microsecond,../reference/api/pandas.Series.dt.microsecond +generated/pandas.Series.dt.microseconds,../reference/api/pandas.Series.dt.microseconds +generated/pandas.Series.dt.minute,../reference/api/pandas.Series.dt.minute +generated/pandas.Series.dt.month,../reference/api/pandas.Series.dt.month +generated/pandas.Series.dt.month_name,../reference/api/pandas.Series.dt.month_name +generated/pandas.Series.dt.nanosecond,../reference/api/pandas.Series.dt.nanosecond +generated/pandas.Series.dt.nanoseconds,../reference/api/pandas.Series.dt.nanoseconds +generated/pandas.Series.dt.normalize,../reference/api/pandas.Series.dt.normalize +generated/pandas.Series.dt.quarter,../reference/api/pandas.Series.dt.quarter +generated/pandas.Series.dt.qyear,../reference/api/pandas.Series.dt.qyear +generated/pandas.Series.dt.round,../reference/api/pandas.Series.dt.round +generated/pandas.Series.dt.second,../reference/api/pandas.Series.dt.second +generated/pandas.Series.dt.seconds,../reference/api/pandas.Series.dt.seconds +generated/pandas.Series.dt.start_time,../reference/api/pandas.Series.dt.start_time +generated/pandas.Series.dt.strftime,../reference/api/pandas.Series.dt.strftime +generated/pandas.Series.dt.time,../reference/api/pandas.Series.dt.time +generated/pandas.Series.dt.timetz,../reference/api/pandas.Series.dt.timetz +generated/pandas.Series.dt.to_period,../reference/api/pandas.Series.dt.to_period +generated/pandas.Series.dt.to_pydatetime,../reference/api/pandas.Series.dt.to_pydatetime +generated/pandas.Series.dt.to_pytimedelta,../reference/api/pandas.Series.dt.to_pytimedelta +generated/pandas.Series.dt.total_seconds,../reference/api/pandas.Series.dt.total_seconds +generated/pandas.Series.dt.tz_convert,../reference/api/pandas.Series.dt.tz_convert +generated/pandas.Series.dt.tz,../reference/api/pandas.Series.dt.tz +generated/pandas.Series.dt.tz_localize,../reference/api/pandas.Series.dt.tz_localize +generated/pandas.Series.dt.weekday,../reference/api/pandas.Series.dt.weekday 
+generated/pandas.Series.dt.week,../reference/api/pandas.Series.dt.week +generated/pandas.Series.dt.weekofyear,../reference/api/pandas.Series.dt.weekofyear +generated/pandas.Series.dt.year,../reference/api/pandas.Series.dt.year +generated/pandas.Series.dtype,../reference/api/pandas.Series.dtype +generated/pandas.Series.dtypes,../reference/api/pandas.Series.dtypes +generated/pandas.Series.duplicated,../reference/api/pandas.Series.duplicated +generated/pandas.Series.empty,../reference/api/pandas.Series.empty +generated/pandas.Series.eq,../reference/api/pandas.Series.eq +generated/pandas.Series.equals,../reference/api/pandas.Series.equals +generated/pandas.Series.ewm,../reference/api/pandas.Series.ewm +generated/pandas.Series.expanding,../reference/api/pandas.Series.expanding +generated/pandas.Series.factorize,../reference/api/pandas.Series.factorize +generated/pandas.Series.ffill,../reference/api/pandas.Series.ffill +generated/pandas.Series.fillna,../reference/api/pandas.Series.fillna +generated/pandas.Series.filter,../reference/api/pandas.Series.filter +generated/pandas.Series.first,../reference/api/pandas.Series.first +generated/pandas.Series.first_valid_index,../reference/api/pandas.Series.first_valid_index +generated/pandas.Series.flags,../reference/api/pandas.Series.flags +generated/pandas.Series.floordiv,../reference/api/pandas.Series.floordiv +generated/pandas.Series.from_array,../reference/api/pandas.Series.from_array +generated/pandas.Series.from_csv,../reference/api/pandas.Series.from_csv +generated/pandas.Series.ftype,../reference/api/pandas.Series.ftype +generated/pandas.Series.ftypes,../reference/api/pandas.Series.ftypes +generated/pandas.Series.ge,../reference/api/pandas.Series.ge +generated/pandas.Series.get_dtype_counts,../reference/api/pandas.Series.get_dtype_counts +generated/pandas.Series.get_ftype_counts,../reference/api/pandas.Series.get_ftype_counts +generated/pandas.Series.get,../reference/api/pandas.Series.get +generated/pandas.Series.get_value,../reference/api/pandas.Series.get_value +generated/pandas.Series.get_values,../reference/api/pandas.Series.get_values +generated/pandas.Series.groupby,../reference/api/pandas.Series.groupby +generated/pandas.Series.gt,../reference/api/pandas.Series.gt +generated/pandas.Series.hasnans,../reference/api/pandas.Series.hasnans +generated/pandas.Series.head,../reference/api/pandas.Series.head +generated/pandas.Series.hist,../reference/api/pandas.Series.hist +generated/pandas.Series,../reference/api/pandas.Series +generated/pandas.Series.iat,../reference/api/pandas.Series.iat +generated/pandas.Series.idxmax,../reference/api/pandas.Series.idxmax +generated/pandas.Series.idxmin,../reference/api/pandas.Series.idxmin +generated/pandas.Series.iloc,../reference/api/pandas.Series.iloc +generated/pandas.Series.imag,../reference/api/pandas.Series.imag +generated/pandas.Series.index,../reference/api/pandas.Series.index +generated/pandas.Series.infer_objects,../reference/api/pandas.Series.infer_objects +generated/pandas.Series.interpolate,../reference/api/pandas.Series.interpolate +generated/pandas.Series.is_copy,../reference/api/pandas.Series.is_copy +generated/pandas.Series.isin,../reference/api/pandas.Series.isin +generated/pandas.Series.is_monotonic_decreasing,../reference/api/pandas.Series.is_monotonic_decreasing +generated/pandas.Series.is_monotonic,../reference/api/pandas.Series.is_monotonic +generated/pandas.Series.is_monotonic_increasing,../reference/api/pandas.Series.is_monotonic_increasing 
+generated/pandas.Series.isna,../reference/api/pandas.Series.isna +generated/pandas.Series.isnull,../reference/api/pandas.Series.isnull +generated/pandas.Series.is_unique,../reference/api/pandas.Series.is_unique +generated/pandas.Series.item,../reference/api/pandas.Series.item +generated/pandas.Series.items,../reference/api/pandas.Series.items +generated/pandas.Series.itemsize,../reference/api/pandas.Series.itemsize +generated/pandas.Series.__iter__,../reference/api/pandas.Series.__iter__ +generated/pandas.Series.iteritems,../reference/api/pandas.Series.iteritems +generated/pandas.Series.ix,../reference/api/pandas.Series.ix +generated/pandas.Series.keys,../reference/api/pandas.Series.keys +generated/pandas.Series.kurt,../reference/api/pandas.Series.kurt +generated/pandas.Series.kurtosis,../reference/api/pandas.Series.kurtosis +generated/pandas.Series.last,../reference/api/pandas.Series.last +generated/pandas.Series.last_valid_index,../reference/api/pandas.Series.last_valid_index +generated/pandas.Series.le,../reference/api/pandas.Series.le +generated/pandas.Series.loc,../reference/api/pandas.Series.loc +generated/pandas.Series.lt,../reference/api/pandas.Series.lt +generated/pandas.Series.mad,../reference/api/pandas.Series.mad +generated/pandas.Series.map,../reference/api/pandas.Series.map +generated/pandas.Series.mask,../reference/api/pandas.Series.mask +generated/pandas.Series.max,../reference/api/pandas.Series.max +generated/pandas.Series.mean,../reference/api/pandas.Series.mean +generated/pandas.Series.median,../reference/api/pandas.Series.median +generated/pandas.Series.memory_usage,../reference/api/pandas.Series.memory_usage +generated/pandas.Series.min,../reference/api/pandas.Series.min +generated/pandas.Series.mode,../reference/api/pandas.Series.mode +generated/pandas.Series.mod,../reference/api/pandas.Series.mod +generated/pandas.Series.mul,../reference/api/pandas.Series.mul +generated/pandas.Series.multiply,../reference/api/pandas.Series.multiply +generated/pandas.Series.name,../reference/api/pandas.Series.name +generated/pandas.Series.nbytes,../reference/api/pandas.Series.nbytes +generated/pandas.Series.ndim,../reference/api/pandas.Series.ndim +generated/pandas.Series.ne,../reference/api/pandas.Series.ne +generated/pandas.Series.nlargest,../reference/api/pandas.Series.nlargest +generated/pandas.Series.nonzero,../reference/api/pandas.Series.nonzero +generated/pandas.Series.notna,../reference/api/pandas.Series.notna +generated/pandas.Series.notnull,../reference/api/pandas.Series.notnull +generated/pandas.Series.nsmallest,../reference/api/pandas.Series.nsmallest +generated/pandas.Series.nunique,../reference/api/pandas.Series.nunique +generated/pandas.Series.pct_change,../reference/api/pandas.Series.pct_change +generated/pandas.Series.pipe,../reference/api/pandas.Series.pipe +generated/pandas.Series.plot.area,../reference/api/pandas.Series.plot.area +generated/pandas.Series.plot.barh,../reference/api/pandas.Series.plot.barh +generated/pandas.Series.plot.bar,../reference/api/pandas.Series.plot.bar +generated/pandas.Series.plot.box,../reference/api/pandas.Series.plot.box +generated/pandas.Series.plot.density,../reference/api/pandas.Series.plot.density +generated/pandas.Series.plot.hist,../reference/api/pandas.Series.plot.hist +generated/pandas.Series.plot,../reference/api/pandas.Series.plot +generated/pandas.Series.plot.kde,../reference/api/pandas.Series.plot.kde +generated/pandas.Series.plot.line,../reference/api/pandas.Series.plot.line 
+generated/pandas.Series.plot.pie,../reference/api/pandas.Series.plot.pie +generated/pandas.Series.pop,../reference/api/pandas.Series.pop +generated/pandas.Series.pow,../reference/api/pandas.Series.pow +generated/pandas.Series.prod,../reference/api/pandas.Series.prod +generated/pandas.Series.product,../reference/api/pandas.Series.product +generated/pandas.Series.ptp,../reference/api/pandas.Series.ptp +generated/pandas.Series.put,../reference/api/pandas.Series.put +generated/pandas.Series.quantile,../reference/api/pandas.Series.quantile +generated/pandas.Series.radd,../reference/api/pandas.Series.radd +generated/pandas.Series.rank,../reference/api/pandas.Series.rank +generated/pandas.Series.ravel,../reference/api/pandas.Series.ravel +generated/pandas.Series.rdiv,../reference/api/pandas.Series.rdiv +generated/pandas.Series.rdivmod,../reference/api/pandas.Series.rdivmod +generated/pandas.Series.real,../reference/api/pandas.Series.real +generated/pandas.Series.reindex_axis,../reference/api/pandas.Series.reindex_axis +generated/pandas.Series.reindex,../reference/api/pandas.Series.reindex +generated/pandas.Series.reindex_like,../reference/api/pandas.Series.reindex_like +generated/pandas.Series.rename_axis,../reference/api/pandas.Series.rename_axis +generated/pandas.Series.rename,../reference/api/pandas.Series.rename +generated/pandas.Series.reorder_levels,../reference/api/pandas.Series.reorder_levels +generated/pandas.Series.repeat,../reference/api/pandas.Series.repeat +generated/pandas.Series.replace,../reference/api/pandas.Series.replace +generated/pandas.Series.resample,../reference/api/pandas.Series.resample +generated/pandas.Series.reset_index,../reference/api/pandas.Series.reset_index +generated/pandas.Series.rfloordiv,../reference/api/pandas.Series.rfloordiv +generated/pandas.Series.rmod,../reference/api/pandas.Series.rmod +generated/pandas.Series.rmul,../reference/api/pandas.Series.rmul +generated/pandas.Series.rolling,../reference/api/pandas.Series.rolling +generated/pandas.Series.round,../reference/api/pandas.Series.round +generated/pandas.Series.rpow,../reference/api/pandas.Series.rpow +generated/pandas.Series.rsub,../reference/api/pandas.Series.rsub +generated/pandas.Series.rtruediv,../reference/api/pandas.Series.rtruediv +generated/pandas.Series.sample,../reference/api/pandas.Series.sample +generated/pandas.Series.searchsorted,../reference/api/pandas.Series.searchsorted +generated/pandas.Series.select,../reference/api/pandas.Series.select +generated/pandas.Series.sem,../reference/api/pandas.Series.sem +generated/pandas.Series.set_axis,../reference/api/pandas.Series.set_axis +generated/pandas.Series.set_value,../reference/api/pandas.Series.set_value +generated/pandas.Series.shape,../reference/api/pandas.Series.shape +generated/pandas.Series.shift,../reference/api/pandas.Series.shift +generated/pandas.Series.size,../reference/api/pandas.Series.size +generated/pandas.Series.skew,../reference/api/pandas.Series.skew +generated/pandas.Series.slice_shift,../reference/api/pandas.Series.slice_shift +generated/pandas.Series.sort_index,../reference/api/pandas.Series.sort_index +generated/pandas.Series.sort_values,../reference/api/pandas.Series.sort_values +generated/pandas.Series.sparse.density,../reference/api/pandas.Series.sparse.density +generated/pandas.Series.sparse.fill_value,../reference/api/pandas.Series.sparse.fill_value +generated/pandas.Series.sparse.from_coo,../reference/api/pandas.Series.sparse.from_coo 
+generated/pandas.Series.sparse.npoints,../reference/api/pandas.Series.sparse.npoints +generated/pandas.Series.sparse.sp_values,../reference/api/pandas.Series.sparse.sp_values +generated/pandas.Series.sparse.to_coo,../reference/api/pandas.Series.sparse.to_coo +generated/pandas.Series.squeeze,../reference/api/pandas.Series.squeeze +generated/pandas.Series.std,../reference/api/pandas.Series.std +generated/pandas.Series.str.capitalize,../reference/api/pandas.Series.str.capitalize +generated/pandas.Series.str.cat,../reference/api/pandas.Series.str.cat +generated/pandas.Series.str.center,../reference/api/pandas.Series.str.center +generated/pandas.Series.str.contains,../reference/api/pandas.Series.str.contains +generated/pandas.Series.str.count,../reference/api/pandas.Series.str.count +generated/pandas.Series.str.decode,../reference/api/pandas.Series.str.decode +generated/pandas.Series.str.encode,../reference/api/pandas.Series.str.encode +generated/pandas.Series.str.endswith,../reference/api/pandas.Series.str.endswith +generated/pandas.Series.str.extractall,../reference/api/pandas.Series.str.extractall +generated/pandas.Series.str.extract,../reference/api/pandas.Series.str.extract +generated/pandas.Series.str.findall,../reference/api/pandas.Series.str.findall +generated/pandas.Series.str.find,../reference/api/pandas.Series.str.find +generated/pandas.Series.str.get_dummies,../reference/api/pandas.Series.str.get_dummies +generated/pandas.Series.str.get,../reference/api/pandas.Series.str.get +generated/pandas.Series.str,../reference/api/pandas.Series.str +generated/pandas.Series.strides,../reference/api/pandas.Series.strides +generated/pandas.Series.str.index,../reference/api/pandas.Series.str.index +generated/pandas.Series.str.isalnum,../reference/api/pandas.Series.str.isalnum +generated/pandas.Series.str.isalpha,../reference/api/pandas.Series.str.isalpha +generated/pandas.Series.str.isdecimal,../reference/api/pandas.Series.str.isdecimal +generated/pandas.Series.str.isdigit,../reference/api/pandas.Series.str.isdigit +generated/pandas.Series.str.islower,../reference/api/pandas.Series.str.islower +generated/pandas.Series.str.isnumeric,../reference/api/pandas.Series.str.isnumeric +generated/pandas.Series.str.isspace,../reference/api/pandas.Series.str.isspace +generated/pandas.Series.str.istitle,../reference/api/pandas.Series.str.istitle +generated/pandas.Series.str.isupper,../reference/api/pandas.Series.str.isupper +generated/pandas.Series.str.join,../reference/api/pandas.Series.str.join +generated/pandas.Series.str.len,../reference/api/pandas.Series.str.len +generated/pandas.Series.str.ljust,../reference/api/pandas.Series.str.ljust +generated/pandas.Series.str.lower,../reference/api/pandas.Series.str.lower +generated/pandas.Series.str.lstrip,../reference/api/pandas.Series.str.lstrip +generated/pandas.Series.str.match,../reference/api/pandas.Series.str.match +generated/pandas.Series.str.normalize,../reference/api/pandas.Series.str.normalize +generated/pandas.Series.str.pad,../reference/api/pandas.Series.str.pad +generated/pandas.Series.str.partition,../reference/api/pandas.Series.str.partition +generated/pandas.Series.str.repeat,../reference/api/pandas.Series.str.repeat +generated/pandas.Series.str.replace,../reference/api/pandas.Series.str.replace +generated/pandas.Series.str.rfind,../reference/api/pandas.Series.str.rfind +generated/pandas.Series.str.rindex,../reference/api/pandas.Series.str.rindex +generated/pandas.Series.str.rjust,../reference/api/pandas.Series.str.rjust 
+generated/pandas.Series.str.rpartition,../reference/api/pandas.Series.str.rpartition +generated/pandas.Series.str.rsplit,../reference/api/pandas.Series.str.rsplit +generated/pandas.Series.str.rstrip,../reference/api/pandas.Series.str.rstrip +generated/pandas.Series.str.slice,../reference/api/pandas.Series.str.slice +generated/pandas.Series.str.slice_replace,../reference/api/pandas.Series.str.slice_replace +generated/pandas.Series.str.split,../reference/api/pandas.Series.str.split +generated/pandas.Series.str.startswith,../reference/api/pandas.Series.str.startswith +generated/pandas.Series.str.strip,../reference/api/pandas.Series.str.strip +generated/pandas.Series.str.swapcase,../reference/api/pandas.Series.str.swapcase +generated/pandas.Series.str.title,../reference/api/pandas.Series.str.title +generated/pandas.Series.str.translate,../reference/api/pandas.Series.str.translate +generated/pandas.Series.str.upper,../reference/api/pandas.Series.str.upper +generated/pandas.Series.str.wrap,../reference/api/pandas.Series.str.wrap +generated/pandas.Series.str.zfill,../reference/api/pandas.Series.str.zfill +generated/pandas.Series.sub,../reference/api/pandas.Series.sub +generated/pandas.Series.subtract,../reference/api/pandas.Series.subtract +generated/pandas.Series.sum,../reference/api/pandas.Series.sum +generated/pandas.Series.swapaxes,../reference/api/pandas.Series.swapaxes +generated/pandas.Series.swaplevel,../reference/api/pandas.Series.swaplevel +generated/pandas.Series.tail,../reference/api/pandas.Series.tail +generated/pandas.Series.take,../reference/api/pandas.Series.take +generated/pandas.Series.T,../reference/api/pandas.Series.T +generated/pandas.Series.timetuple,../reference/api/pandas.Series.timetuple +generated/pandas.Series.to_clipboard,../reference/api/pandas.Series.to_clipboard +generated/pandas.Series.to_csv,../reference/api/pandas.Series.to_csv +generated/pandas.Series.to_dense,../reference/api/pandas.Series.to_dense +generated/pandas.Series.to_dict,../reference/api/pandas.Series.to_dict +generated/pandas.Series.to_excel,../reference/api/pandas.Series.to_excel +generated/pandas.Series.to_frame,../reference/api/pandas.Series.to_frame +generated/pandas.Series.to_hdf,../reference/api/pandas.Series.to_hdf +generated/pandas.Series.to_json,../reference/api/pandas.Series.to_json +generated/pandas.Series.to_latex,../reference/api/pandas.Series.to_latex +generated/pandas.Series.to_list,../reference/api/pandas.Series.to_list +generated/pandas.Series.tolist,../reference/api/pandas.Series.tolist +generated/pandas.Series.to_msgpack,../reference/api/pandas.Series.to_msgpack +generated/pandas.Series.to_numpy,../reference/api/pandas.Series.to_numpy +generated/pandas.Series.to_period,../reference/api/pandas.Series.to_period +generated/pandas.Series.to_pickle,../reference/api/pandas.Series.to_pickle +generated/pandas.Series.to_sparse,../reference/api/pandas.Series.to_sparse +generated/pandas.Series.to_sql,../reference/api/pandas.Series.to_sql +generated/pandas.Series.to_string,../reference/api/pandas.Series.to_string +generated/pandas.Series.to_timestamp,../reference/api/pandas.Series.to_timestamp +generated/pandas.Series.to_xarray,../reference/api/pandas.Series.to_xarray +generated/pandas.Series.transform,../reference/api/pandas.Series.transform +generated/pandas.Series.transpose,../reference/api/pandas.Series.transpose +generated/pandas.Series.truediv,../reference/api/pandas.Series.truediv +generated/pandas.Series.truncate,../reference/api/pandas.Series.truncate 
+generated/pandas.Series.tshift,../reference/api/pandas.Series.tshift +generated/pandas.Series.tz_convert,../reference/api/pandas.Series.tz_convert +generated/pandas.Series.tz_localize,../reference/api/pandas.Series.tz_localize +generated/pandas.Series.unique,../reference/api/pandas.Series.unique +generated/pandas.Series.unstack,../reference/api/pandas.Series.unstack +generated/pandas.Series.update,../reference/api/pandas.Series.update +generated/pandas.Series.valid,../reference/api/pandas.Series.valid +generated/pandas.Series.value_counts,../reference/api/pandas.Series.value_counts +generated/pandas.Series.values,../reference/api/pandas.Series.values +generated/pandas.Series.var,../reference/api/pandas.Series.var +generated/pandas.Series.view,../reference/api/pandas.Series.view +generated/pandas.Series.where,../reference/api/pandas.Series.where +generated/pandas.Series.xs,../reference/api/pandas.Series.xs +generated/pandas.set_option,../reference/api/pandas.set_option +generated/pandas.SparseDataFrame.to_coo,../reference/api/pandas.SparseDataFrame.to_coo +generated/pandas.SparseSeries.from_coo,../reference/api/pandas.SparseSeries.from_coo +generated/pandas.SparseSeries.to_coo,../reference/api/pandas.SparseSeries.to_coo +generated/pandas.test,../reference/api/pandas.test +generated/pandas.testing.assert_frame_equal,../reference/api/pandas.testing.assert_frame_equal +generated/pandas.testing.assert_index_equal,../reference/api/pandas.testing.assert_index_equal +generated/pandas.testing.assert_series_equal,../reference/api/pandas.testing.assert_series_equal +generated/pandas.Timedelta.asm8,../reference/api/pandas.Timedelta.asm8 +generated/pandas.Timedelta.ceil,../reference/api/pandas.Timedelta.ceil +generated/pandas.Timedelta.components,../reference/api/pandas.Timedelta.components +generated/pandas.Timedelta.days,../reference/api/pandas.Timedelta.days +generated/pandas.Timedelta.delta,../reference/api/pandas.Timedelta.delta +generated/pandas.Timedelta.floor,../reference/api/pandas.Timedelta.floor +generated/pandas.Timedelta.freq,../reference/api/pandas.Timedelta.freq +generated/pandas.Timedelta,../reference/api/pandas.Timedelta +generated/pandas.TimedeltaIndex.ceil,../reference/api/pandas.TimedeltaIndex.ceil +generated/pandas.TimedeltaIndex.components,../reference/api/pandas.TimedeltaIndex.components +generated/pandas.TimedeltaIndex.days,../reference/api/pandas.TimedeltaIndex.days +generated/pandas.TimedeltaIndex.floor,../reference/api/pandas.TimedeltaIndex.floor +generated/pandas.TimedeltaIndex,../reference/api/pandas.TimedeltaIndex +generated/pandas.TimedeltaIndex.inferred_freq,../reference/api/pandas.TimedeltaIndex.inferred_freq +generated/pandas.TimedeltaIndex.microseconds,../reference/api/pandas.TimedeltaIndex.microseconds +generated/pandas.TimedeltaIndex.nanoseconds,../reference/api/pandas.TimedeltaIndex.nanoseconds +generated/pandas.TimedeltaIndex.round,../reference/api/pandas.TimedeltaIndex.round +generated/pandas.TimedeltaIndex.seconds,../reference/api/pandas.TimedeltaIndex.seconds +generated/pandas.TimedeltaIndex.to_frame,../reference/api/pandas.TimedeltaIndex.to_frame +generated/pandas.TimedeltaIndex.to_pytimedelta,../reference/api/pandas.TimedeltaIndex.to_pytimedelta +generated/pandas.TimedeltaIndex.to_series,../reference/api/pandas.TimedeltaIndex.to_series +generated/pandas.Timedelta.isoformat,../reference/api/pandas.Timedelta.isoformat +generated/pandas.Timedelta.is_populated,../reference/api/pandas.Timedelta.is_populated 
+generated/pandas.Timedelta.max,../reference/api/pandas.Timedelta.max +generated/pandas.Timedelta.microseconds,../reference/api/pandas.Timedelta.microseconds +generated/pandas.Timedelta.min,../reference/api/pandas.Timedelta.min +generated/pandas.Timedelta.nanoseconds,../reference/api/pandas.Timedelta.nanoseconds +generated/pandas.timedelta_range,../reference/api/pandas.timedelta_range +generated/pandas.Timedelta.resolution,../reference/api/pandas.Timedelta.resolution +generated/pandas.Timedelta.round,../reference/api/pandas.Timedelta.round +generated/pandas.Timedelta.seconds,../reference/api/pandas.Timedelta.seconds +generated/pandas.Timedelta.to_pytimedelta,../reference/api/pandas.Timedelta.to_pytimedelta +generated/pandas.Timedelta.total_seconds,../reference/api/pandas.Timedelta.total_seconds +generated/pandas.Timedelta.to_timedelta64,../reference/api/pandas.Timedelta.to_timedelta64 +generated/pandas.Timedelta.value,../reference/api/pandas.Timedelta.value +generated/pandas.Timedelta.view,../reference/api/pandas.Timedelta.view +generated/pandas.Timestamp.asm8,../reference/api/pandas.Timestamp.asm8 +generated/pandas.Timestamp.astimezone,../reference/api/pandas.Timestamp.astimezone +generated/pandas.Timestamp.ceil,../reference/api/pandas.Timestamp.ceil +generated/pandas.Timestamp.combine,../reference/api/pandas.Timestamp.combine +generated/pandas.Timestamp.ctime,../reference/api/pandas.Timestamp.ctime +generated/pandas.Timestamp.date,../reference/api/pandas.Timestamp.date +generated/pandas.Timestamp.day,../reference/api/pandas.Timestamp.day +generated/pandas.Timestamp.day_name,../reference/api/pandas.Timestamp.day_name +generated/pandas.Timestamp.dayofweek,../reference/api/pandas.Timestamp.dayofweek +generated/pandas.Timestamp.dayofyear,../reference/api/pandas.Timestamp.dayofyear +generated/pandas.Timestamp.days_in_month,../reference/api/pandas.Timestamp.days_in_month +generated/pandas.Timestamp.daysinmonth,../reference/api/pandas.Timestamp.daysinmonth +generated/pandas.Timestamp.dst,../reference/api/pandas.Timestamp.dst +generated/pandas.Timestamp.floor,../reference/api/pandas.Timestamp.floor +generated/pandas.Timestamp.fold,../reference/api/pandas.Timestamp.fold +generated/pandas.Timestamp.freq,../reference/api/pandas.Timestamp.freq +generated/pandas.Timestamp.freqstr,../reference/api/pandas.Timestamp.freqstr +generated/pandas.Timestamp.fromisoformat,../reference/api/pandas.Timestamp.fromisoformat +generated/pandas.Timestamp.fromordinal,../reference/api/pandas.Timestamp.fromordinal +generated/pandas.Timestamp.fromtimestamp,../reference/api/pandas.Timestamp.fromtimestamp +generated/pandas.Timestamp.hour,../reference/api/pandas.Timestamp.hour +generated/pandas.Timestamp,../reference/api/pandas.Timestamp +generated/pandas.Timestamp.is_leap_year,../reference/api/pandas.Timestamp.is_leap_year +generated/pandas.Timestamp.is_month_end,../reference/api/pandas.Timestamp.is_month_end +generated/pandas.Timestamp.is_month_start,../reference/api/pandas.Timestamp.is_month_start +generated/pandas.Timestamp.isocalendar,../reference/api/pandas.Timestamp.isocalendar +generated/pandas.Timestamp.isoformat,../reference/api/pandas.Timestamp.isoformat +generated/pandas.Timestamp.isoweekday,../reference/api/pandas.Timestamp.isoweekday +generated/pandas.Timestamp.is_quarter_end,../reference/api/pandas.Timestamp.is_quarter_end +generated/pandas.Timestamp.is_quarter_start,../reference/api/pandas.Timestamp.is_quarter_start +generated/pandas.Timestamp.is_year_end,../reference/api/pandas.Timestamp.is_year_end 
+generated/pandas.Timestamp.is_year_start,../reference/api/pandas.Timestamp.is_year_start +generated/pandas.Timestamp.max,../reference/api/pandas.Timestamp.max +generated/pandas.Timestamp.microsecond,../reference/api/pandas.Timestamp.microsecond +generated/pandas.Timestamp.min,../reference/api/pandas.Timestamp.min +generated/pandas.Timestamp.minute,../reference/api/pandas.Timestamp.minute +generated/pandas.Timestamp.month,../reference/api/pandas.Timestamp.month +generated/pandas.Timestamp.month_name,../reference/api/pandas.Timestamp.month_name +generated/pandas.Timestamp.nanosecond,../reference/api/pandas.Timestamp.nanosecond +generated/pandas.Timestamp.normalize,../reference/api/pandas.Timestamp.normalize +generated/pandas.Timestamp.now,../reference/api/pandas.Timestamp.now +generated/pandas.Timestamp.quarter,../reference/api/pandas.Timestamp.quarter +generated/pandas.Timestamp.replace,../reference/api/pandas.Timestamp.replace +generated/pandas.Timestamp.resolution,../reference/api/pandas.Timestamp.resolution +generated/pandas.Timestamp.round,../reference/api/pandas.Timestamp.round +generated/pandas.Timestamp.second,../reference/api/pandas.Timestamp.second +generated/pandas.Timestamp.strftime,../reference/api/pandas.Timestamp.strftime +generated/pandas.Timestamp.strptime,../reference/api/pandas.Timestamp.strptime +generated/pandas.Timestamp.time,../reference/api/pandas.Timestamp.time +generated/pandas.Timestamp.timestamp,../reference/api/pandas.Timestamp.timestamp +generated/pandas.Timestamp.timetuple,../reference/api/pandas.Timestamp.timetuple +generated/pandas.Timestamp.timetz,../reference/api/pandas.Timestamp.timetz +generated/pandas.Timestamp.to_datetime64,../reference/api/pandas.Timestamp.to_datetime64 +generated/pandas.Timestamp.today,../reference/api/pandas.Timestamp.today +generated/pandas.Timestamp.to_julian_date,../reference/api/pandas.Timestamp.to_julian_date +generated/pandas.Timestamp.toordinal,../reference/api/pandas.Timestamp.toordinal +generated/pandas.Timestamp.to_period,../reference/api/pandas.Timestamp.to_period +generated/pandas.Timestamp.to_pydatetime,../reference/api/pandas.Timestamp.to_pydatetime +generated/pandas.Timestamp.tz_convert,../reference/api/pandas.Timestamp.tz_convert +generated/pandas.Timestamp.tz,../reference/api/pandas.Timestamp.tz +generated/pandas.Timestamp.tzinfo,../reference/api/pandas.Timestamp.tzinfo +generated/pandas.Timestamp.tz_localize,../reference/api/pandas.Timestamp.tz_localize +generated/pandas.Timestamp.tzname,../reference/api/pandas.Timestamp.tzname +generated/pandas.Timestamp.utcfromtimestamp,../reference/api/pandas.Timestamp.utcfromtimestamp +generated/pandas.Timestamp.utcnow,../reference/api/pandas.Timestamp.utcnow +generated/pandas.Timestamp.utcoffset,../reference/api/pandas.Timestamp.utcoffset +generated/pandas.Timestamp.utctimetuple,../reference/api/pandas.Timestamp.utctimetuple +generated/pandas.Timestamp.value,../reference/api/pandas.Timestamp.value +generated/pandas.Timestamp.weekday,../reference/api/pandas.Timestamp.weekday +generated/pandas.Timestamp.weekday_name,../reference/api/pandas.Timestamp.weekday_name +generated/pandas.Timestamp.week,../reference/api/pandas.Timestamp.week +generated/pandas.Timestamp.weekofyear,../reference/api/pandas.Timestamp.weekofyear +generated/pandas.Timestamp.year,../reference/api/pandas.Timestamp.year +generated/pandas.to_datetime,../reference/api/pandas.to_datetime +generated/pandas.to_numeric,../reference/api/pandas.to_numeric 
+generated/pandas.to_timedelta,../reference/api/pandas.to_timedelta +generated/pandas.tseries.frequencies.to_offset,../reference/api/pandas.tseries.frequencies.to_offset +generated/pandas.unique,../reference/api/pandas.unique +generated/pandas.util.hash_array,../reference/api/pandas.util.hash_array +generated/pandas.util.hash_pandas_object,../reference/api/pandas.util.hash_pandas_object +generated/pandas.wide_to_long,../reference/api/pandas.wide_to_long diff --git a/doc/source/10min.rst b/doc/source/10min.rst deleted file mode 100644 index 8482eef552c17..0000000000000 --- a/doc/source/10min.rst +++ /dev/null @@ -1,812 +0,0 @@ -.. _10min: - -.. currentmodule:: pandas - -.. ipython:: python - :suppress: - - import numpy as np - import pandas as pd - import os - np.random.seed(123456) - np.set_printoptions(precision=4, suppress=True) - import matplotlib - matplotlib.style.use('ggplot') - pd.options.display.max_rows = 15 - - #### portions of this were borrowed from the - #### Pandas cheatsheet - #### created during the PyData Workshop-Sprint 2012 - #### Hannah Chen, Henry Chow, Eric Cox, Robert Mauriello - - -******************** -10 Minutes to pandas -******************** - -This is a short introduction to pandas, geared mainly for new users. -You can see more complex recipes in the :ref:`Cookbook` - -Customarily, we import as follows: - -.. ipython:: python - - import pandas as pd - import numpy as np - import matplotlib.pyplot as plt - -Object Creation ---------------- - -See the :ref:`Data Structure Intro section ` - -Creating a :class:`Series` by passing a list of values, letting pandas create -a default integer index: - -.. ipython:: python - - s = pd.Series([1,3,5,np.nan,6,8]) - s - -Creating a :class:`DataFrame` by passing a numpy array, with a datetime index -and labeled columns: - -.. ipython:: python - - dates = pd.date_range('20130101', periods=6) - dates - df = pd.DataFrame(np.random.randn(6,4), index=dates, columns=list('ABCD')) - df - -Creating a ``DataFrame`` by passing a dict of objects that can be converted to series-like. - -.. ipython:: python - - df2 = pd.DataFrame({ 'A' : 1., - 'B' : pd.Timestamp('20130102'), - 'C' : pd.Series(1,index=list(range(4)),dtype='float32'), - 'D' : np.array([3] * 4,dtype='int32'), - 'E' : pd.Categorical(["test","train","test","train"]), - 'F' : 'foo' }) - df2 - -Having specific :ref:`dtypes ` - -.. ipython:: python - - df2.dtypes - -If you're using IPython, tab completion for column names (as well as public -attributes) is automatically enabled. Here's a subset of the attributes that -will be completed: - -.. ipython:: - - @verbatim - In [1]: df2. - df2.A df2.bool - df2.abs df2.boxplot - df2.add df2.C - df2.add_prefix df2.clip - df2.add_suffix df2.clip_lower - df2.align df2.clip_upper - df2.all df2.columns - df2.any df2.combine - df2.append df2.combine_first - df2.apply df2.compound - df2.applymap df2.consolidate - df2.as_blocks df2.convert_objects - df2.asfreq df2.copy - df2.as_matrix df2.corr - df2.astype df2.corrwith - df2.at df2.count - df2.at_time df2.cov - df2.axes df2.cummax - df2.B df2.cummin - df2.between_time df2.cumprod - df2.bfill df2.cumsum - df2.blocks df2.D - -As you can see, the columns ``A``, ``B``, ``C``, and ``D`` are automatically -tab completed. ``E`` is there as well; the rest of the attributes have been -truncated for brevity. - -Viewing Data ------------- - -See the :ref:`Basics section ` - -See the top & bottom rows of the frame - -.. 
ipython:: python - - df.head() - df.tail(3) - -Display the index, columns, and the underlying numpy data - -.. ipython:: python - - df.index - df.columns - df.values - -Describe shows a quick statistic summary of your data - -.. ipython:: python - - df.describe() - -Transposing your data - -.. ipython:: python - - df.T - -Sorting by an axis - -.. ipython:: python - - df.sort_index(axis=1, ascending=False) - -Sorting by values - -.. ipython:: python - - df.sort_values(by='B') - -Selection ---------- - -.. note:: - - While standard Python / Numpy expressions for selecting and setting are - intuitive and come in handy for interactive work, for production code, we - recommend the optimized pandas data access methods, ``.at``, ``.iat``, - ``.loc``, ``.iloc`` and ``.ix``. - -See the indexing documentation :ref:`Indexing and Selecting Data ` and :ref:`MultiIndex / Advanced Indexing ` - -Getting -~~~~~~~ - -Selecting a single column, which yields a ``Series``, -equivalent to ``df.A`` - -.. ipython:: python - - df['A'] - -Selecting via ``[]``, which slices the rows. - -.. ipython:: python - - df[0:3] - df['20130102':'20130104'] - -Selection by Label -~~~~~~~~~~~~~~~~~~ - -See more in :ref:`Selection by Label ` - -For getting a cross section using a label - -.. ipython:: python - - df.loc[dates[0]] - -Selecting on a multi-axis by label - -.. ipython:: python - - df.loc[:,['A','B']] - -Showing label slicing, both endpoints are *included* - -.. ipython:: python - - df.loc['20130102':'20130104',['A','B']] - -Reduction in the dimensions of the returned object - -.. ipython:: python - - df.loc['20130102',['A','B']] - -For getting a scalar value - -.. ipython:: python - - df.loc[dates[0],'A'] - -For getting fast access to a scalar (equiv to the prior method) - -.. ipython:: python - - df.at[dates[0],'A'] - -Selection by Position -~~~~~~~~~~~~~~~~~~~~~ - -See more in :ref:`Selection by Position ` - -Select via the position of the passed integers - -.. ipython:: python - - df.iloc[3] - -By integer slices, acting similar to numpy/python - -.. ipython:: python - - df.iloc[3:5,0:2] - -By lists of integer position locations, similar to the numpy/python style - -.. ipython:: python - - df.iloc[[1,2,4],[0,2]] - -For slicing rows explicitly - -.. ipython:: python - - df.iloc[1:3,:] - -For slicing columns explicitly - -.. ipython:: python - - df.iloc[:,1:3] - -For getting a value explicitly - -.. ipython:: python - - df.iloc[1,1] - -For getting fast access to a scalar (equiv to the prior method) - -.. ipython:: python - - df.iat[1,1] - -Boolean Indexing -~~~~~~~~~~~~~~~~ - -Using a single column's values to select data. - -.. ipython:: python - - df[df.A > 0] - -Selecting values from a DataFrame where a boolean condition is met. - -.. ipython:: python - - df[df > 0] - -Using the :func:`~Series.isin` method for filtering: - -.. ipython:: python - - df2 = df.copy() - df2['E'] = ['one', 'one','two','three','four','three'] - df2 - df2[df2['E'].isin(['two','four'])] - -Setting -~~~~~~~ - -Setting a new column automatically aligns the data -by the indexes - -.. ipython:: python - - s1 = pd.Series([1,2,3,4,5,6], index=pd.date_range('20130102', periods=6)) - s1 - df['F'] = s1 - -Setting values by label - -.. ipython:: python - - df.at[dates[0],'A'] = 0 - -Setting values by position - -.. ipython:: python - - df.iat[0,1] = 0 - -Setting by assigning with a numpy array - -.. ipython:: python - - df.loc[:,'D'] = np.array([5] * len(df)) - -The result of the prior setting operations - -.. 
ipython:: python - - df - -A ``where`` operation with setting. - -.. ipython:: python - - df2 = df.copy() - df2[df2 > 0] = -df2 - df2 - - -Missing Data ------------- - -pandas primarily uses the value ``np.nan`` to represent missing data. It is by -default not included in computations. See the :ref:`Missing Data section -` - -Reindexing allows you to change/add/delete the index on a specified axis. This -returns a copy of the data. - -.. ipython:: python - - df1 = df.reindex(index=dates[0:4], columns=list(df.columns) + ['E']) - df1.loc[dates[0]:dates[1],'E'] = 1 - df1 - -To drop any rows that have missing data. - -.. ipython:: python - - df1.dropna(how='any') - -Filling missing data - -.. ipython:: python - - df1.fillna(value=5) - -To get the boolean mask where values are ``nan`` - -.. ipython:: python - - pd.isnull(df1) - - -Operations ----------- - -See the :ref:`Basic section on Binary Ops ` - -Stats -~~~~~ - -Operations in general *exclude* missing data. - -Performing a descriptive statistic - -.. ipython:: python - - df.mean() - -Same operation on the other axis - -.. ipython:: python - - df.mean(1) - -Operating with objects that have different dimensionality and need alignment. -In addition, pandas automatically broadcasts along the specified dimension. - -.. ipython:: python - - s = pd.Series([1,3,5,np.nan,6,8], index=dates).shift(2) - s - df.sub(s, axis='index') - - -Apply -~~~~~ - -Applying functions to the data - -.. ipython:: python - - df.apply(np.cumsum) - df.apply(lambda x: x.max() - x.min()) - -Histogramming -~~~~~~~~~~~~~ - -See more at :ref:`Histogramming and Discretization ` - -.. ipython:: python - - s = pd.Series(np.random.randint(0, 7, size=10)) - s - s.value_counts() - -String Methods -~~~~~~~~~~~~~~ - -Series is equipped with a set of string processing methods in the `str` -attribute that make it easy to operate on each element of the array, as in the -code snippet below. Note that pattern-matching in `str` generally uses `regular -expressions `__ by default (and in -some cases always uses them). See more at :ref:`Vectorized String Methods -`. - -.. ipython:: python - - s = pd.Series(['A', 'B', 'C', 'Aaba', 'Baca', np.nan, 'CABA', 'dog', 'cat']) - s.str.lower() - -Merge ------ - -Concat -~~~~~~ - -pandas provides various facilities for easily combining together Series, -DataFrame, and Panel objects with various kinds of set logic for the indexes -and relational algebra functionality in the case of join / merge-type -operations. - -See the :ref:`Merging section ` - -Concatenating pandas objects together with :func:`concat`: - -.. ipython:: python - - df = pd.DataFrame(np.random.randn(10, 4)) - df - - # break it into pieces - pieces = [df[:3], df[3:7], df[7:]] - - pd.concat(pieces) - -Join -~~~~ - -SQL style merges. See the :ref:`Database style joining ` - -.. ipython:: python - - left = pd.DataFrame({'key': ['foo', 'foo'], 'lval': [1, 2]}) - right = pd.DataFrame({'key': ['foo', 'foo'], 'rval': [4, 5]}) - left - right - pd.merge(left, right, on='key') - -Another example that can be given is: - -.. ipython:: python - - left = pd.DataFrame({'key': ['foo', 'bar'], 'lval': [1, 2]}) - right = pd.DataFrame({'key': ['foo', 'bar'], 'rval': [4, 5]}) - left - right - pd.merge(left, right, on='key') - - -Append -~~~~~~ - -Append rows to a dataframe. See the :ref:`Appending ` - -.. 
ipython:: python - - df = pd.DataFrame(np.random.randn(8, 4), columns=['A','B','C','D']) - df - s = df.iloc[3] - df.append(s, ignore_index=True) - - -Grouping --------- - -By "group by" we are referring to a process involving one or more of the -following steps - - - **Splitting** the data into groups based on some criteria - - **Applying** a function to each group independently - - **Combining** the results into a data structure - -See the :ref:`Grouping section ` - -.. ipython:: python - - df = pd.DataFrame({'A' : ['foo', 'bar', 'foo', 'bar', - 'foo', 'bar', 'foo', 'foo'], - 'B' : ['one', 'one', 'two', 'three', - 'two', 'two', 'one', 'three'], - 'C' : np.random.randn(8), - 'D' : np.random.randn(8)}) - df - -Grouping and then applying a function ``sum`` to the resulting groups. - -.. ipython:: python - - df.groupby('A').sum() - -Grouping by multiple columns forms a hierarchical index, which we then apply -the function. - -.. ipython:: python - - df.groupby(['A','B']).sum() - -Reshaping ---------- - -See the sections on :ref:`Hierarchical Indexing ` and -:ref:`Reshaping `. - -Stack -~~~~~ - -.. ipython:: python - - tuples = list(zip(*[['bar', 'bar', 'baz', 'baz', - 'foo', 'foo', 'qux', 'qux'], - ['one', 'two', 'one', 'two', - 'one', 'two', 'one', 'two']])) - index = pd.MultiIndex.from_tuples(tuples, names=['first', 'second']) - df = pd.DataFrame(np.random.randn(8, 2), index=index, columns=['A', 'B']) - df2 = df[:4] - df2 - -The :meth:`~DataFrame.stack` method "compresses" a level in the DataFrame's -columns. - -.. ipython:: python - - stacked = df2.stack() - stacked - -With a "stacked" DataFrame or Series (having a ``MultiIndex`` as the -``index``), the inverse operation of :meth:`~DataFrame.stack` is -:meth:`~DataFrame.unstack`, which by default unstacks the **last level**: - -.. ipython:: python - - stacked.unstack() - stacked.unstack(1) - stacked.unstack(0) - -Pivot Tables -~~~~~~~~~~~~ -See the section on :ref:`Pivot Tables `. - -.. ipython:: python - - df = pd.DataFrame({'A' : ['one', 'one', 'two', 'three'] * 3, - 'B' : ['A', 'B', 'C'] * 4, - 'C' : ['foo', 'foo', 'foo', 'bar', 'bar', 'bar'] * 2, - 'D' : np.random.randn(12), - 'E' : np.random.randn(12)}) - df - -We can produce pivot tables from this data very easily: - -.. ipython:: python - - pd.pivot_table(df, values='D', index=['A', 'B'], columns=['C']) - - -Time Series ------------ - -pandas has simple, powerful, and efficient functionality for performing -resampling operations during frequency conversion (e.g., converting secondly -data into 5-minutely data). This is extremely common in, but not limited to, -financial applications. See the :ref:`Time Series section ` - -.. ipython:: python - - rng = pd.date_range('1/1/2012', periods=100, freq='S') - ts = pd.Series(np.random.randint(0, 500, len(rng)), index=rng) - ts.resample('5Min').sum() - -Time zone representation - -.. ipython:: python - - rng = pd.date_range('3/6/2012 00:00', periods=5, freq='D') - ts = pd.Series(np.random.randn(len(rng)), rng) - ts - ts_utc = ts.tz_localize('UTC') - ts_utc - -Convert to another time zone - -.. ipython:: python - - ts_utc.tz_convert('US/Eastern') - -Converting between time span representations - -.. ipython:: python - - rng = pd.date_range('1/1/2012', periods=5, freq='M') - ts = pd.Series(np.random.randn(len(rng)), index=rng) - ts - ps = ts.to_period() - ps - ps.to_timestamp() - -Converting between period and timestamp enables some convenient arithmetic -functions to be used. 
In the following example, we convert a quarterly -frequency with year ending in November to 9am of the end of the month following -the quarter end: - -.. ipython:: python - - prng = pd.period_range('1990Q1', '2000Q4', freq='Q-NOV') - ts = pd.Series(np.random.randn(len(prng)), prng) - ts.index = (prng.asfreq('M', 'e') + 1).asfreq('H', 's') + 9 - ts.head() - -Categoricals ------------- - -Since version 0.15, pandas can include categorical data in a ``DataFrame``. For full docs, see the -:ref:`categorical introduction ` and the :ref:`API documentation `. - -.. ipython:: python - - df = pd.DataFrame({"id":[1,2,3,4,5,6], "raw_grade":['a', 'b', 'b', 'a', 'a', 'e']}) - -Convert the raw grades to a categorical data type. - -.. ipython:: python - - df["grade"] = df["raw_grade"].astype("category") - df["grade"] - -Rename the categories to more meaningful names (assigning to ``Series.cat.categories`` is inplace!) - -.. ipython:: python - - df["grade"].cat.categories = ["very good", "good", "very bad"] - -Reorder the categories and simultaneously add the missing categories (methods under ``Series -.cat`` return a new ``Series`` per default). - -.. ipython:: python - - df["grade"] = df["grade"].cat.set_categories(["very bad", "bad", "medium", "good", "very good"]) - df["grade"] - -Sorting is per order in the categories, not lexical order. - -.. ipython:: python - - df.sort_values(by="grade") - -Grouping by a categorical column shows also empty categories. - -.. ipython:: python - - df.groupby("grade").size() - - -Plotting --------- - -:ref:`Plotting ` docs. - -.. ipython:: python - :suppress: - - import matplotlib.pyplot as plt - plt.close('all') - -.. ipython:: python - - ts = pd.Series(np.random.randn(1000), index=pd.date_range('1/1/2000', periods=1000)) - ts = ts.cumsum() - - @savefig series_plot_basic.png - ts.plot() - -On DataFrame, :meth:`~DataFrame.plot` is a convenience to plot all of the -columns with labels: - -.. ipython:: python - - df = pd.DataFrame(np.random.randn(1000, 4), index=ts.index, - columns=['A', 'B', 'C', 'D']) - df = df.cumsum() - - @savefig frame_plot_basic.png - plt.figure(); df.plot(); plt.legend(loc='best') - -Getting Data In/Out -------------------- - -CSV -~~~ - -:ref:`Writing to a csv file ` - -.. ipython:: python - - df.to_csv('foo.csv') - -:ref:`Reading from a csv file ` - -.. ipython:: python - - pd.read_csv('foo.csv') - -.. ipython:: python - :suppress: - - os.remove('foo.csv') - -HDF5 -~~~~ - -Reading and writing to :ref:`HDFStores ` - -Writing to a HDF5 Store - -.. ipython:: python - - df.to_hdf('foo.h5','df') - -Reading from a HDF5 Store - -.. ipython:: python - - pd.read_hdf('foo.h5','df') - -.. ipython:: python - :suppress: - - os.remove('foo.h5') - -Excel -~~~~~ - -Reading and writing to :ref:`MS Excel ` - -Writing to an excel file - -.. ipython:: python - - df.to_excel('foo.xlsx', sheet_name='Sheet1') - -Reading from an excel file - -.. ipython:: python - - pd.read_excel('foo.xlsx', 'Sheet1', index_col=None, na_values=['NA']) - -.. ipython:: python - :suppress: - - os.remove('foo.xlsx') - -Gotchas -------- - -If you are trying an operation and you see an exception like: - -.. code-block:: python - - >>> if pd.Series([False, True, False]): - print("I was true") - Traceback - ... - ValueError: The truth value of an array is ambiguous. Use a.empty, a.any() or a.all(). - -See :ref:`Comparisons` for an explanation and what to do. - -See :ref:`Gotchas` as well. 
diff --git a/doc/source/_static/banklist.html b/doc/source/_static/banklist.html
index 8ec1561f8c394..cb07c332acbe7 100644
--- a/doc/source/_static/banklist.html
+++ b/doc/source/_static/banklist.html
[hunks omitted: formatting-only changes (trailing whitespace removed) throughout this FDIC "Failed Bank List" HTML test fixture]
  • ").html( !data ? "No match!" : "Selected: " + formatted).appendTo("#result"); } - + function formatItem(row) { return row[0] + " (id: " + row[1] + ")"; } @@ -81,7 +81,7 @@ selectFirst: false }); - + $("#search2").autocomplete("/searchjs.asp", { width: 160, autoFill: false, @@ -93,7 +93,7 @@ selectFirst: false }); - + }); @@ -232,16 +232,16 @@

    Each depositor insured to at least $250,000 per insured bank

    Failed Bank List

    The FDIC is often appointed as receiver for failed banks. This page contains useful information for the customers and vendors of these banks. This includes information on the acquiring bank (if applicable), how your accounts and loans are affected, and how vendors can file claims against the receivership. Failed Financial Institution Contact Search displays point of contact information related to failed banks.

    - +

    This list includes banks which have failed since October 1, 2000. To search for banks that failed prior to those on this page, visit this link: Failures and Assistance Transactions

    - +

    Failed Bank List - CSV file (Updated on Mondays. Also opens in Excel - Excel Help)

    - +

    Due to the small screen size some information is no longer visible.
    Full information available when viewed on a larger screen.

    @@ -253,7 +253,7 @@

    Failed Bank List

    City ST CERT - Acquiring Institution + Acquiring Institution Closing Date Updated Date @@ -294,7 +294,7 @@

    Failed Bank List

    Capital Bank, N.A. May 10, 2013 May 14, 2013 - + Douglas County Bank Douglasville @@ -383,7 +383,7 @@

    Failed Bank List

    Sunwest Bank January 11, 2013 January 24, 2013 - + Community Bank of the Ozarks Sunrise Beach @@ -392,7 +392,7 @@

    Failed Bank List

    Bank of Sullivan December 14, 2012 January 24, 2013 - + Hometown Community Bank Braselton @@ -401,7 +401,7 @@

    Failed Bank List

    CertusBank, National Association November 16, 2012 January 24, 2013 - + Citizens First National Bank Princeton @@ -518,7 +518,7 @@

    Failed Bank List

    Metcalf Bank July 20, 2012 December 17, 2012 - + First Cherokee State Bank Woodstock @@ -635,7 +635,7 @@

    Failed Bank List

    Southern States Bank May 18, 2012 May 20, 2013 - + Security Bank, National Association North Lauderdale @@ -644,7 +644,7 @@

    Failed Bank List

    Banesco USA May 4, 2012 October 31, 2012 - + Palm Desert National Bank Palm Desert @@ -734,7 +734,7 @@

    Failed Bank List

    No Acquirer March 9, 2012 October 29, 2012 - + Global Commerce Bank Doraville @@ -752,7 +752,7 @@

    Failed Bank List

    No Acquirer February 24, 2012 December 17, 2012 - + Central Bank of Georgia Ellaville @@ -761,7 +761,7 @@

    Failed Bank List

    Ameris Bank February 24, 2012 August 9, 2012 - + SCB Bank Shelbyville @@ -770,7 +770,7 @@

    Failed Bank List

    First Merchants Bank, National Association February 10, 2012 March 25, 2013 - + Charter National Bank and Trust Hoffman Estates @@ -779,7 +779,7 @@

    Failed Bank List

    Barrington Bank & Trust Company, National Association February 10, 2012 March 25, 2013 - + BankEast Knoxville @@ -788,7 +788,7 @@

    Failed Bank List

    U.S.Bank National Association January 27, 2012 March 8, 2013 - + Patriot Bank Minnesota Forest Lake @@ -797,7 +797,7 @@

    Failed Bank List

    First Resource Bank January 27, 2012 September 12, 2012 - + Tennessee Commerce Bank Franklin @@ -806,7 +806,7 @@

    Failed Bank List

    Republic Bank & Trust Company January 27, 2012 November 20, 2012 - + First Guaranty Bank and Trust Company of Jacksonville Jacksonville @@ -815,7 +815,7 @@

    Failed Bank List

    CenterState Bank of Florida, N.A. January 27, 2012 September 12, 2012 - + American Eagle Savings Bank Boothwyn @@ -824,7 +824,7 @@

    Failed Bank List

    Capital Bank, N.A. January 20, 2012 January 25, 2013 - + The First State Bank Stockbridge @@ -833,7 +833,7 @@

    Failed Bank List

    Hamilton State Bank January 20, 2012 January 25, 2013 - + Central Florida State Bank Belleview @@ -842,7 +842,7 @@

    Failed Bank List

    CenterState Bank of Florida, N.A. January 20, 2012 January 25, 2013 - + Western National Bank Phoenix @@ -869,7 +869,7 @@

    Failed Bank List

    First NBC Bank November 18, 2011 August 13, 2012 - + Polk County Bank Johnston @@ -887,7 +887,7 @@

    Failed Bank List

    Century Bank of Georgia November 10, 2011 August 13, 2012 - + SunFirst Bank Saint George @@ -896,7 +896,7 @@

    Failed Bank List

    Cache Valley Bank November 4, 2011 November 16, 2012 - + Mid City Bank, Inc. Omaha @@ -905,7 +905,7 @@

    Failed Bank List

    Premier Bank November 4, 2011 August 15, 2012 - + All American Bank Des Plaines @@ -914,7 +914,7 @@

    Failed Bank List

    International Bank of Chicago October 28, 2011 August 15, 2012 - + Community Banks of Colorado Greenwood Village @@ -959,7 +959,7 @@

    Failed Bank List

    Blackhawk Bank & Trust October 14, 2011 August 15, 2012 - + First State Bank Cranford @@ -968,7 +968,7 @@

    Failed Bank List

    Northfield Bank October 14, 2011 November 8, 2012 - + Blue Ridge Savings Bank, Inc. Asheville @@ -977,7 +977,7 @@

    Failed Bank List

    Bank of North Carolina October 14, 2011 November 8, 2012 - + Piedmont Community Bank Gray @@ -986,7 +986,7 @@

    Failed Bank List

    State Bank and Trust Company October 14, 2011 January 22, 2013 - + Sun Security Bank Ellington @@ -1202,7 +1202,7 @@

    Failed Bank List

    Ameris Bank July 15, 2011 November 2, 2012 - + One Georgia Bank Atlanta @@ -1247,7 +1247,7 @@

    Failed Bank List

    First American Bank and Trust Company June 24, 2011 November 2, 2012 - + First Commercial Bank of Tampa Bay Tampa @@ -1256,7 +1256,7 @@

    Failed Bank List

    Stonegate Bank June 17, 2011 November 2, 2012 - + McIntosh State Bank Jackson @@ -1265,7 +1265,7 @@

    Failed Bank List

    Hamilton State Bank June 17, 2011 November 2, 2012 - + Atlantic Bank and Trust Charleston @@ -1274,7 +1274,7 @@

    Failed Bank List

    First Citizens Bank and Trust Company, Inc. June 3, 2011 October 31, 2012 - + First Heritage Bank Snohomish @@ -1283,7 +1283,7 @@

    Failed Bank List

    Columbia State Bank May 27, 2011 January 28, 2013 - + Summit Bank Burlington @@ -1292,7 +1292,7 @@

    Failed Bank List

    Columbia State Bank May 20, 2011 January 22, 2013 - + First Georgia Banking Company Franklin @@ -2030,7 +2030,7 @@

    Failed Bank List

    Westamerica Bank August 20, 2010 September 12, 2012 - + Los Padres Bank Solvang @@ -2624,7 +2624,7 @@

    Failed Bank List

    MB Financial Bank, N.A. April 23, 2010 August 23, 2012 - + Amcore Bank, National Association Rockford @@ -2768,7 +2768,7 @@

    Failed Bank List

    First Citizens Bank March 19, 2010 August 23, 2012 - + Bank of Hiawassee Hiawassee @@ -3480,7 +3480,7 @@

    Failed Bank List

    October 2, 2009 August 21, 2012 - + Warren Bank Warren MI @@ -3767,7 +3767,7 @@

    Failed Bank List

    Herring Bank July 31, 2009 August 20, 2012 - + Security Bank of Jones County Gray @@ -3848,7 +3848,7 @@

    Failed Bank List

    California Bank & Trust July 17, 2009 August 20, 2012 - + BankFirst Sioux Falls @@ -4811,7 +4811,7 @@

    Failed Bank List

    Bank of the Orient October 13, 2000 March 17, 2005 - + @@ -4849,12 +4849,12 @@

    Failed Bank List